# As usual, a bit of setup
import time
import numpy as np
import matplotlib.pyplot as plt
from cs682.data_utils import get_CIFAR10_data
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision.datasets as dset
import torchvision.transforms as T
import torch.nn.functional as F
%matplotlib inline
# Use a large default figure so the image grids plotted further down stay readable.
plt.rcParams['figure.figsize'] = (20.0, 16.0) # set default size of plots
# Nearest-neighbour interpolation shows each pixel of the small images as a crisp square.
plt.rcParams['image.interpolation'] = 'nearest'
# plt.rcParams['image.cmap'] = 'gray'
# for auto-reloading external modules
# see http://stackoverflow.com/questions/1907993/autoreload-of-modules-in-ipython
%load_ext autoreload
%autoreload 2
def rel_error(x, y):
    """Return the largest element-wise relative error between x and y.

    Each absolute difference is divided by |x| + |y|; the denominator is
    floored at 1e-8 so that two zero entries do not divide by zero.
    """
    difference = np.abs(x - y)
    scale = np.maximum(1e-8, np.abs(x) + np.abs(y))
    return np.max(difference / scale)
# Load the CIFAR10 splits without mean subtraction, report each array's shape,
# and rescale the image arrays (keys starting with "X") by 1/255.
unproccessed_data = get_CIFAR10_data(subtract_mean=False)
for k, v in unproccessed_data.items():
    print('%s: ' % k, v.shape)
    if not k.startswith("X"):
        # Label arrays are left untouched.
        continue
    # Presumably maps 0-255 pixel values into [0, 1] - confirm against get_CIFAR10_data.
    unproccessed_data[k] = v / 255
X_train: (49000, 3, 32, 32) y_train: (49000,) X_val: (1000, 3, 32, 32) y_val: (1000,) X_test: (1000, 3, 32, 32) y_test: (1000,)
Convert the images to grayscale for the X (input) data and use the original color images as the Y (target) data
# The targets ("y_*") of the colorization task are the original color images.
data = {
    "y_train": unproccessed_data["X_train"],
    "y_val": unproccessed_data["X_val"],
    "y_test": unproccessed_data["X_test"],
}
# Convert X data to B/W
def convertToBW(data):
    """Return a gray copy of an image batch shaped (N, 3, W, H).

    The three input channels are mixed with the weights 0.299, 0.587 and
    0.114, and the resulting plane is written to each of the first three
    channels of a freshly allocated array with the same shape as data.
    """
    red, green, blue = data[:, 0, :, :], data[:, 1, :, :], data[:, 2, :, :]
    luma = 0.299 * red + 0.587 * green + 0.114 * blue
    gray = np.zeros(data.shape)
    # One broadcast assignment fills channels 0, 1 and 2 with the same plane.
    gray[:, :3, :, :] = luma[:, np.newaxis, :, :]
    return gray
# The network inputs ("X_*") are gray versions of every split.
data.update({
    "X_train": convertToBW(unproccessed_data["X_train"]),
    "X_val": convertToBW(unproccessed_data["X_val"]),
    "X_test": convertToBW(unproccessed_data["X_test"]),
})
# Preview five randomly drawn training pairs: input on the left, target on the right.
fig, axs = plt.subplots(5, 2)
idx = np.random.choice(range(data["X_train"].shape[0]), 5)
# Only the top row carries the column titles.
axs[0, 0].title.set_text('X data')
axs[0, 1].title.set_text('Y data')
for i, sample in enumerate(idx):
    # imshow wants channels last, so move (C, rows, cols) to (rows, cols, C).
    axs[i, 0].imshow(data["X_train"][sample].transpose(1, 2, 0))
    axs[i, 1].imshow(data["y_train"][sample].transpose(1, 2, 0))
Test a basic model that uses a single fully connected (FC) layer
USE_GPU = True
dtype = torch.float32 # we will be using float throughout this tutorial
# CUDA is used only when it is both requested and available; otherwise the CPU.
device = torch.device('cuda' if USE_GPU and torch.cuda.is_available() else 'cpu')
# Constant to control how frequently we print train loss
print_every = 100
print('using device:', device)
def flatten(x):
    """Collapse every dimension after the first into a single one.

    Returns a view of x with shape (x.shape[0], -1).
    """
    return x.view(x.shape[0], -1)
using device: cpu
# Number of random training samples train() draws for each epoch.
batch_size = 100
# Print the loss every 20 iterations (replaces the value of 100 assigned during device setup).
print_every = 20
def train(model, optimizer, epochs=1, x_train=data["X_train"], y_train=data["y_train"], criterion=nn.MSELoss()):
    """
    Train a model with one gradient step per sample, using the PyTorch Module API.

    Each "epoch" draws batch_size random indices (np.random.choice, i.e. with
    replacement) from x_train / y_train and then performs one optimizer step
    for every drawn sample. An epoch is therefore batch_size single-image
    updates, not a full pass over the training set.

    Inputs:
    - model: A PyTorch Module giving the model to train. Its epochsTrained
      counter is incremented once per epoch (started at 0 if the attribute
      is missing).
    - optimizer: An Optimizer object we will use to train the model
    - epochs: (Optional) A Python integer giving the number of epochs to train for
    - x_train: (Optional) numpy array of model inputs, indexed along axis 0
    - y_train: (Optional) numpy array of targets aligned with x_train
    - criterion: (Optional) callable taking the flattened prediction and the
      flattened target and returning a scalar loss tensor

    Returns: Nothing, but prints the training loss every print_every iterations.
    """
    model = model.to(device=device)  # move the model parameters to CPU/GPU
    # Nothing below leaves training mode, so switching once is enough.
    model.train()
    num_examples = x_train.shape[0]
    for e in range(epochs):
        model.epochsTrained = getattr(model, "epochsTrained", 0) + 1
        print('--- Epoch %s / %s - %s epochs total' % (e + 1, epochs, model.epochsTrained))

        # Passing the population size as an int avoids materialising range(N) every epoch.
        idx = np.random.choice(num_examples, batch_size)
        x_batch = torch.from_numpy(x_train[idx])
        y_batch = flatten(torch.from_numpy(y_train[idx]))

        for t in range(x_batch.size()[0]):
            x = x_batch[t].to(device=device, dtype=dtype)
            y = y_batch[t].to(device=device, dtype=dtype)

            scores = model(x)
            loss = criterion(scores.view(-1), y.view(-1))

            # Zero out all of the gradients for the variables which the optimizer
            # will update.
            optimizer.zero_grad()

            # This is the backwards pass: compute the gradient of the loss with
            # respect to each parameter of the model.
            loss.backward()

            # Actually update the parameters of the model using the gradients
            # computed by the backwards pass.
            optimizer.step()

            if t % print_every == 0:
                print('Iteration %d, loss = %.4f' % (t, loss.item()))
class BasicNet(nn.Module):
    """Single fully connected layer mapping a flattened input to an output of equal length."""

    def __init__(self, input_size):
        super().__init__()
        # Running count of training epochs; train() increments it once per epoch.
        self.epochsTrained = 0
        self.fc = nn.Linear(in_features=input_size, out_features=input_size)

    def forward(self, x):
        # The whole tensor is flattened into one vector, so x has to hold
        # exactly one sample with input_size elements.
        flat = x.view(-1)
        return self.fc(flat)
# Baseline experiment: train the single-layer model with plain SGD for 25 epochs.
learning_rate = 1e-2
# Layer size is 3 channels times the two trailing dimensions of the training images.
model1 = BasicNet(3 * data["X_train"].shape[2] * data["X_train"].shape[3])
optimizer = optim.SGD(model1.parameters(), lr=learning_rate)
train(model1, optimizer, epochs=25)
--- Epoch 1 / 25 - 1 epochs total Iteration 0, loss = 0.1488 Iteration 20, loss = 0.2187 Iteration 40, loss = 0.4903 Iteration 60, loss = 0.6881 Iteration 80, loss = 0.1929 --- Epoch 2 / 25 - 2 epochs total Iteration 0, loss = 0.1037 Iteration 20, loss = 0.0865 Iteration 40, loss = 0.0571 Iteration 60, loss = 0.1310 Iteration 80, loss = 0.1437 --- Epoch 3 / 25 - 3 epochs total Iteration 0, loss = 0.0813 Iteration 20, loss = 0.2574 Iteration 40, loss = 0.0593 Iteration 60, loss = 0.1005 Iteration 80, loss = 0.0389 --- Epoch 4 / 25 - 4 epochs total Iteration 0, loss = 0.0145 Iteration 20, loss = 0.1109 Iteration 40, loss = 0.0839 Iteration 60, loss = 0.0890 Iteration 80, loss = 0.1745 --- Epoch 5 / 25 - 5 epochs total Iteration 0, loss = 0.0308 Iteration 20, loss = 0.0375 Iteration 40, loss = 0.1164 Iteration 60, loss = 0.0505 Iteration 80, loss = 0.0474 --- Epoch 6 / 25 - 6 epochs total Iteration 0, loss = 0.0188 Iteration 20, loss = 0.0376 Iteration 40, loss = 0.0421 Iteration 60, loss = 0.0615 Iteration 80, loss = 0.0739 --- Epoch 7 / 25 - 7 epochs total Iteration 0, loss = 0.0254 Iteration 20, loss = 0.0462 Iteration 40, loss = 0.0866 Iteration 60, loss = 0.0442 Iteration 80, loss = 0.0398 --- Epoch 8 / 25 - 8 epochs total Iteration 0, loss = 0.0476 Iteration 20, loss = 0.0264 Iteration 40, loss = 0.0345 Iteration 60, loss = 0.0511 Iteration 80, loss = 0.0583 --- Epoch 9 / 25 - 9 epochs total Iteration 0, loss = 0.0698 Iteration 20, loss = 0.0462 Iteration 40, loss = 0.0438 Iteration 60, loss = 0.0477 Iteration 80, loss = 0.0605 --- Epoch 10 / 25 - 10 epochs total Iteration 0, loss = 0.0684 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0425 Iteration 60, loss = 0.0418 Iteration 80, loss = 0.0762 --- Epoch 11 / 25 - 11 epochs total Iteration 0, loss = 0.0578 Iteration 20, loss = 0.1219 Iteration 40, loss = 0.0485 Iteration 60, loss = 0.0437 Iteration 80, loss = 0.0725 --- Epoch 12 / 25 - 12 epochs total Iteration 0, loss = 0.1021 Iteration 20, loss = 0.0815 
Iteration 40, loss = 0.0393 Iteration 60, loss = 0.0431 Iteration 80, loss = 0.0653 --- Epoch 13 / 25 - 13 epochs total Iteration 0, loss = 0.0581 Iteration 20, loss = 0.1159 Iteration 40, loss = 0.0406 Iteration 60, loss = 0.0558 Iteration 80, loss = 0.0403 --- Epoch 14 / 25 - 14 epochs total Iteration 0, loss = 0.0160 Iteration 20, loss = 0.1339 Iteration 40, loss = 0.0924 Iteration 60, loss = 0.0632 Iteration 80, loss = 0.0237 --- Epoch 15 / 25 - 15 epochs total Iteration 0, loss = 0.0275 Iteration 20, loss = 0.0514 Iteration 40, loss = 0.0580 Iteration 60, loss = 0.0503 Iteration 80, loss = 0.0365 --- Epoch 16 / 25 - 16 epochs total Iteration 0, loss = 0.0645 Iteration 20, loss = 0.0301 Iteration 40, loss = 0.0662 Iteration 60, loss = 0.0634 Iteration 80, loss = 0.0356 --- Epoch 17 / 25 - 17 epochs total Iteration 0, loss = 0.0517 Iteration 20, loss = 0.0566 Iteration 40, loss = 0.0724 Iteration 60, loss = 0.0264 Iteration 80, loss = 0.0671 --- Epoch 18 / 25 - 18 epochs total Iteration 0, loss = 0.0507 Iteration 20, loss = 0.0167 Iteration 40, loss = 0.0526 Iteration 60, loss = 0.0588 Iteration 80, loss = 0.0459 --- Epoch 19 / 25 - 19 epochs total Iteration 0, loss = 0.0549 Iteration 20, loss = 0.0494 Iteration 40, loss = 0.0355 Iteration 60, loss = 0.0258 Iteration 80, loss = 0.0681 --- Epoch 20 / 25 - 20 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0552 Iteration 40, loss = 0.0585 Iteration 60, loss = 0.0344 Iteration 80, loss = 0.0662 --- Epoch 21 / 25 - 21 epochs total Iteration 0, loss = 0.0338 Iteration 20, loss = 0.0382 Iteration 40, loss = 0.0445 Iteration 60, loss = 0.0495 Iteration 80, loss = 0.1125 --- Epoch 22 / 25 - 22 epochs total Iteration 0, loss = 0.0905 Iteration 20, loss = 0.0246 Iteration 40, loss = 0.0579 Iteration 60, loss = 0.0920 Iteration 80, loss = 0.0637 --- Epoch 23 / 25 - 23 epochs total Iteration 0, loss = 0.0438 Iteration 20, loss = 0.0504 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0454 Iteration 80, loss 
= 0.0272 --- Epoch 24 / 25 - 24 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0197 Iteration 40, loss = 0.0689 Iteration 60, loss = 0.0461 Iteration 80, loss = 0.0629 --- Epoch 25 / 25 - 25 epochs total Iteration 0, loss = 0.0734 Iteration 20, loss = 0.0574 Iteration 40, loss = 0.0919 Iteration 60, loss = 0.0485 Iteration 80, loss = 0.0501
def testModel(model, n=10, x_test=data["X_test"], y_test=data["y_test"], criterion=nn.MSELoss()):
    """
    Plot n random test samples next to the model's prediction and the target.

    Every row of the figure shows the input image, the prediction (titled
    with its loss against the target) and the target image.

    Inputs:
    - model: trained PyTorch Module; it is switched to eval mode.
    - n: number of samples to draw (np.random.choice, i.e. with replacement).
    - x_test: numpy array of inputs, one (C, rows, cols) image per index.
    - y_test: numpy array of targets aligned with x_test.
    - criterion: callable returning a scalar loss for (prediction, target).

    Returns: Nothing; the figure is drawn with matplotlib.
    """
    model.eval()

    # squeeze=False keeps axs two-dimensional, so axs[i, j] also works for n == 1.
    fig, axs = plt.subplots(n, 3, squeeze=False)
    fig.tight_layout()
    fig.set_size_inches(10, 25)
    idx = np.random.choice(x_test.shape[0], n)

    for i in range(n):
        sample = x_test[idx[i]]
        y_data = y_test[idx[i]]
        x_data = torch.from_numpy(sample).to(device=device, dtype=dtype)
        target = torch.from_numpy(y_data).to(device=device, dtype=dtype)

        # Pure inference: no autograd graph is needed.
        with torch.no_grad():
            # Shape the prediction like its target instead of assuming 3x32x32.
            predicted = model(x_data).view(target.shape)
            loss = criterion(predicted, target)

        # Set axis titles
        axs[i, 0].title.set_text('X data')
        axs[i, 1].title.set_text('Loss=' + "{:.9f}".format(loss.item()))
        axs[i, 2].title.set_text('Actual')

        # .cpu() is required before .numpy() when the model runs on CUDA.
        predicted_image = predicted.cpu().numpy().transpose(1, 2, 0)
        axs[i, 0].imshow(sample.transpose(1, 2, 0))
        # imshow clips float RGB data to [0, 1] anyway; clipping here avoids its warning.
        axs[i, 1].imshow(np.clip(predicted_image, 0.0, 1.0))
        axs[i, 2].imshow(y_data.transpose(1, 2, 0))
# Visualize predictions of the single-layer baseline on random test images.
testModel(model1)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
class BasicConvNet(nn.Module):
    """Three unpadded 3x3 convolutions followed by a single linear layer.

    For a 3x32x32 input the spatial size shrinks 32 -> 30 -> 28 -> 26, so the
    last convolution yields 12 * 26 * 26 = 8112 features for the linear
    layer, which emits 32 * 32 * 3 values.
    """

    def __init__(self):
        super().__init__()
        # Running count of training epochs; train() increments it once per epoch.
        self.epochsTrained = 0
        self.conv1 = nn.Conv2d(in_channels=3, out_channels=24, kernel_size=3, stride=1, padding=0)  # 24 3x3 filters
        self.conv2 = nn.Conv2d(in_channels=24, out_channels=24, kernel_size=3, stride=1, padding=0)  # 24 3x3 filters
        self.conv3 = nn.Conv2d(in_channels=24, out_channels=12, kernel_size=3, stride=1, padding=0)  # 12 3x3 filters
        self.fc = nn.Linear(8112, 32 * 32 * 3)

    def forward(self, x):
        # A single (C, rows, cols) sample gets a leading batch dimension of 1.
        features = x.unsqueeze(0)
        for conv in (self.conv1, self.conv2, self.conv3):
            features = F.relu(conv(features))
        return self.fc(features.view(-1))
# Train the three-convolution baseline with the same learning rate and epoch count as the FC model.
learning_rate = 1e-2
model2 = BasicConvNet()
optimizer = optim.SGD(model2.parameters(), lr=learning_rate)
# MSELoss is passed explicitly here; it is also train()'s default criterion.
train(model2, optimizer, epochs=25, criterion=nn.MSELoss())
--- Epoch 1 / 25 - 1 epochs total Iteration 0, loss = 0.3250 Iteration 20, loss = 0.1401 Iteration 40, loss = 0.2926 Iteration 60, loss = 0.3218 Iteration 80, loss = 0.2827 --- Epoch 2 / 25 - 2 epochs total Iteration 0, loss = 0.3426 Iteration 20, loss = 0.1222 Iteration 40, loss = 0.5539 Iteration 60, loss = 0.1707 Iteration 80, loss = 0.3535 --- Epoch 3 / 25 - 3 epochs total Iteration 0, loss = 0.2681 Iteration 20, loss = 0.2246 Iteration 40, loss = 0.3098 Iteration 60, loss = 0.1848 Iteration 80, loss = 0.3872 --- Epoch 4 / 25 - 4 epochs total Iteration 0, loss = 0.0420 Iteration 20, loss = 0.2622 Iteration 40, loss = 0.1603 Iteration 60, loss = 0.0840 Iteration 80, loss = 0.1690 --- Epoch 5 / 25 - 5 epochs total Iteration 0, loss = 0.0431 Iteration 20, loss = 0.1285 Iteration 40, loss = 0.0655 Iteration 60, loss = 0.0661 Iteration 80, loss = 0.0665 --- Epoch 6 / 25 - 6 epochs total Iteration 0, loss = 0.0418 Iteration 20, loss = 0.0540 Iteration 40, loss = 0.1009 Iteration 60, loss = 0.0712 Iteration 80, loss = 0.0702 --- Epoch 7 / 25 - 7 epochs total Iteration 0, loss = 0.0361 Iteration 20, loss = 0.0178 Iteration 40, loss = 0.0333 Iteration 60, loss = 0.0257 Iteration 80, loss = 0.0402 --- Epoch 8 / 25 - 8 epochs total Iteration 0, loss = 0.0361 Iteration 20, loss = 0.0587 Iteration 40, loss = 0.0777 Iteration 60, loss = 0.0482 Iteration 80, loss = 0.0690 --- Epoch 9 / 25 - 9 epochs total Iteration 0, loss = 0.0463 Iteration 20, loss = 0.0761 Iteration 40, loss = 0.0588 Iteration 60, loss = 0.0356 Iteration 80, loss = 0.0691 --- Epoch 10 / 25 - 10 epochs total Iteration 0, loss = 0.0794 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0387 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0259 --- Epoch 11 / 25 - 11 epochs total Iteration 0, loss = 0.0665 Iteration 20, loss = 0.0568 Iteration 40, loss = 0.0544 Iteration 60, loss = 0.0923 Iteration 80, loss = 0.0191 --- Epoch 12 / 25 - 12 epochs total Iteration 0, loss = 0.0189 Iteration 20, loss = 0.0431 
Iteration 40, loss = 0.0440 Iteration 60, loss = 0.0827 Iteration 80, loss = 0.0411 --- Epoch 13 / 25 - 13 epochs total Iteration 0, loss = 0.0408 Iteration 20, loss = 0.0383 Iteration 40, loss = 0.0811 Iteration 60, loss = 0.0319 Iteration 80, loss = 0.0371 --- Epoch 14 / 25 - 14 epochs total Iteration 0, loss = 0.0675 Iteration 20, loss = 0.0269 Iteration 40, loss = 0.0464 Iteration 60, loss = 0.0359 Iteration 80, loss = 0.0777 --- Epoch 15 / 25 - 15 epochs total Iteration 0, loss = 0.0494 Iteration 20, loss = 0.0465 Iteration 40, loss = 0.0550 Iteration 60, loss = 0.0470 Iteration 80, loss = 0.0217 --- Epoch 16 / 25 - 16 epochs total Iteration 0, loss = 0.0241 Iteration 20, loss = 0.0531 Iteration 40, loss = 0.0545 Iteration 60, loss = 0.0363 Iteration 80, loss = 0.0274 --- Epoch 17 / 25 - 17 epochs total Iteration 0, loss = 0.0668 Iteration 20, loss = 0.0375 Iteration 40, loss = 0.0313 Iteration 60, loss = 0.0566 Iteration 80, loss = 0.0603 --- Epoch 18 / 25 - 18 epochs total Iteration 0, loss = 0.0432 Iteration 20, loss = 0.0534 Iteration 40, loss = 0.0431 Iteration 60, loss = 0.0287 Iteration 80, loss = 0.0745 --- Epoch 19 / 25 - 19 epochs total Iteration 0, loss = 0.0599 Iteration 20, loss = 0.0335 Iteration 40, loss = 0.0950 Iteration 60, loss = 0.0310 Iteration 80, loss = 0.0671 --- Epoch 20 / 25 - 20 epochs total Iteration 0, loss = 0.0641 Iteration 20, loss = 0.0458 Iteration 40, loss = 0.0320 Iteration 60, loss = 0.0294 Iteration 80, loss = 0.0455 --- Epoch 21 / 25 - 21 epochs total Iteration 0, loss = 0.0222 Iteration 20, loss = 0.0361 Iteration 40, loss = 0.0441 Iteration 60, loss = 0.0221 Iteration 80, loss = 0.0387 --- Epoch 22 / 25 - 22 epochs total Iteration 0, loss = 0.0297 Iteration 20, loss = 0.0431 Iteration 40, loss = 0.0498 Iteration 60, loss = 0.0388 Iteration 80, loss = 0.0436 --- Epoch 23 / 25 - 23 epochs total Iteration 0, loss = 0.0531 Iteration 20, loss = 0.0676 Iteration 40, loss = 0.0386 Iteration 60, loss = 0.0482 Iteration 80, loss 
= 0.0523 --- Epoch 24 / 25 - 24 epochs total Iteration 0, loss = 0.0627 Iteration 20, loss = 0.0386 Iteration 40, loss = 0.0173 Iteration 60, loss = 0.0525 Iteration 80, loss = 0.0631 --- Epoch 25 / 25 - 25 epochs total Iteration 0, loss = 0.0793 Iteration 20, loss = 0.0748 Iteration 40, loss = 0.0250 Iteration 60, loss = 0.0448 Iteration 80, loss = 0.0378
# Visualize predictions of the basic convolutional model on random test images.
testModel(model2)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
class ConvNet(nn.Module):
    """Convolutional net with batch norm and a skip connection from the raw input.

    The three unpadded convolutions (5x5, 4x4, 3x3) shrink a 3x32x32 input
    32 -> 28 -> 25 -> 23. The 12 * 23 * 23 = 6348 resulting features are
    concatenated with the 3 * 32 * 32 = 3072 input values, giving the 9420
    inputs of the final linear layer.
    """

    def __init__(self):
        super().__init__()
        # Running count of training epochs; train() increments it once per epoch.
        self.epochsTrained = 0
        # The attribute names do not match the sizes: these normalize 24 and 12 channels.
        self.batchnorm48 = nn.BatchNorm2d(24)
        self.batchnorm24 = nn.BatchNorm2d(12)
        self.conv1 = nn.Conv2d(in_channels=3, out_channels=24, kernel_size=5, stride=1, padding=0)  # 24 5x5 filters
        self.conv2 = nn.Conv2d(in_channels=24, out_channels=24, kernel_size=4, stride=1, padding=0)  # 24 4x4 filters
        self.conv3 = nn.Conv2d(in_channels=24, out_channels=12, kernel_size=3, stride=1, padding=0)  # 12 3x3 filters
        self.fc = nn.Linear(9420, 32 * 32 * 3)

    def forward(self, x):
        # A single (C, rows, cols) sample gets a leading batch dimension of 1.
        batched = x.unsqueeze(0)

        hidden = F.relu(self.conv1(batched))
        hidden = self.batchnorm48(hidden)

        hidden = F.relu(self.conv2(hidden))
        # NOTE(review): this is the same BatchNorm module used after conv1, so
        # both stages share one set of affine parameters and running statistics.
        hidden = self.batchnorm48(hidden)

        hidden = F.relu(self.conv3(hidden))
        hidden = self.batchnorm24(hidden)

        # Skip connection: append the raw input values to the conv features.
        combined = torch.cat((hidden.view(-1), x.view(-1)), 0)
        return self.fc(combined)
# Train the batch-norm / skip-connection ConvNet for 50 epochs with train()'s default MSE criterion.
learning_rate = 1e-2
model3 = ConvNet()
optimizer = optim.SGD(model3.parameters(), lr=learning_rate)
train(model3, optimizer, epochs=50)
--- Epoch 1 / 50 - 1 epochs total Iteration 0, loss = 0.4640 Iteration 20, loss = 0.6072 Iteration 40, loss = 0.3148 Iteration 60, loss = 0.4069 Iteration 80, loss = 0.4691 --- Epoch 2 / 50 - 2 epochs total Iteration 0, loss = 0.3967 Iteration 20, loss = 0.2838 Iteration 40, loss = 0.3281 Iteration 60, loss = 0.2043 Iteration 80, loss = 0.2292 --- Epoch 3 / 50 - 3 epochs total Iteration 0, loss = 0.1746 Iteration 20, loss = 0.2492 Iteration 40, loss = 0.3015 Iteration 60, loss = 0.2115 Iteration 80, loss = 0.1473 --- Epoch 4 / 50 - 4 epochs total Iteration 0, loss = 0.2002 Iteration 20, loss = 0.1324 Iteration 40, loss = 0.1655 Iteration 60, loss = 0.1047 Iteration 80, loss = 0.1279 --- Epoch 5 / 50 - 5 epochs total Iteration 0, loss = 0.0658 Iteration 20, loss = 0.1138 Iteration 40, loss = 0.0834 Iteration 60, loss = 0.0691 Iteration 80, loss = 0.1292 --- Epoch 6 / 50 - 6 epochs total Iteration 0, loss = 0.0616 Iteration 20, loss = 0.0694 Iteration 40, loss = 0.0584 Iteration 60, loss = 0.0816 Iteration 80, loss = 0.0577 --- Epoch 7 / 50 - 7 epochs total Iteration 0, loss = 0.1324 Iteration 20, loss = 0.0863 Iteration 40, loss = 0.0708 Iteration 60, loss = 0.0754 Iteration 80, loss = 0.0538 --- Epoch 8 / 50 - 8 epochs total Iteration 0, loss = 0.0802 Iteration 20, loss = 0.0406 Iteration 40, loss = 0.1031 Iteration 60, loss = 0.0588 Iteration 80, loss = 0.0686 --- Epoch 9 / 50 - 9 epochs total Iteration 0, loss = 0.1652 Iteration 20, loss = 0.0631 Iteration 40, loss = 0.0613 Iteration 60, loss = 0.0669 Iteration 80, loss = 0.0380 --- Epoch 10 / 50 - 10 epochs total Iteration 0, loss = 0.0784 Iteration 20, loss = 0.0547 Iteration 40, loss = 0.0615 Iteration 60, loss = 0.0810 Iteration 80, loss = 0.0512 --- Epoch 11 / 50 - 11 epochs total Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0955 Iteration 40, loss = 0.0307 Iteration 60, loss = 0.0660 Iteration 80, loss = 0.0666 --- Epoch 12 / 50 - 12 epochs total Iteration 0, loss = 0.0620 Iteration 20, loss = 0.0627 
Iteration 40, loss = 0.0634 Iteration 60, loss = 0.0754 Iteration 80, loss = 0.0725 --- Epoch 13 / 50 - 13 epochs total Iteration 0, loss = 0.0478 Iteration 20, loss = 0.0635 Iteration 40, loss = 0.0587 Iteration 60, loss = 0.0401 Iteration 80, loss = 0.0480 --- Epoch 14 / 50 - 14 epochs total Iteration 0, loss = 0.0413 Iteration 20, loss = 0.0322 Iteration 40, loss = 0.0501 Iteration 60, loss = 0.0378 Iteration 80, loss = 0.0433 --- Epoch 15 / 50 - 15 epochs total Iteration 0, loss = 0.0587 Iteration 20, loss = 0.0390 Iteration 40, loss = 0.0298 Iteration 60, loss = 0.0265 Iteration 80, loss = 0.0504 --- Epoch 16 / 50 - 16 epochs total Iteration 0, loss = 0.0631 Iteration 20, loss = 0.0567 Iteration 40, loss = 0.0511 Iteration 60, loss = 0.0489 Iteration 80, loss = 0.0436 --- Epoch 17 / 50 - 17 epochs total Iteration 0, loss = 0.0723 Iteration 20, loss = 0.0434 Iteration 40, loss = 0.0835 Iteration 60, loss = 0.0518 Iteration 80, loss = 0.1040 --- Epoch 18 / 50 - 18 epochs total Iteration 0, loss = 0.0448 Iteration 20, loss = 0.0658 Iteration 40, loss = 0.0714 Iteration 60, loss = 0.0629 Iteration 80, loss = 0.0710 --- Epoch 19 / 50 - 19 epochs total Iteration 0, loss = 0.0361 Iteration 20, loss = 0.0423 Iteration 40, loss = 0.0460 Iteration 60, loss = 0.0197 Iteration 80, loss = 0.0468 --- Epoch 20 / 50 - 20 epochs total Iteration 0, loss = 0.0461 Iteration 20, loss = 0.0503 Iteration 40, loss = 0.0350 Iteration 60, loss = 0.0665 Iteration 80, loss = 0.0705 --- Epoch 21 / 50 - 21 epochs total Iteration 0, loss = 0.0350 Iteration 20, loss = 0.0433 Iteration 40, loss = 0.0592 Iteration 60, loss = 0.0395 Iteration 80, loss = 0.0410 --- Epoch 22 / 50 - 22 epochs total Iteration 0, loss = 0.0369 Iteration 20, loss = 0.0385 Iteration 40, loss = 0.0337 Iteration 60, loss = 0.0424 Iteration 80, loss = 0.0314 --- Epoch 23 / 50 - 23 epochs total Iteration 0, loss = 0.0529 Iteration 20, loss = 0.0471 Iteration 40, loss = 0.0548 Iteration 60, loss = 0.0590 Iteration 80, loss 
= 0.0609 --- Epoch 24 / 50 - 24 epochs total Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0695 Iteration 40, loss = 0.0591 Iteration 60, loss = 0.0346 Iteration 80, loss = 0.0626 --- Epoch 25 / 50 - 25 epochs total Iteration 0, loss = 0.0495 Iteration 20, loss = 0.0444 Iteration 40, loss = 0.0306 Iteration 60, loss = 0.0263 Iteration 80, loss = 0.0384 --- Epoch 26 / 50 - 26 epochs total Iteration 0, loss = 0.0502 Iteration 20, loss = 0.0604 Iteration 40, loss = 0.0319 Iteration 60, loss = 0.0243 Iteration 80, loss = 0.0575 --- Epoch 27 / 50 - 27 epochs total Iteration 0, loss = 0.0354 Iteration 20, loss = 0.0336 Iteration 40, loss = 0.0672 Iteration 60, loss = 0.0593 Iteration 80, loss = 0.0332 --- Epoch 28 / 50 - 28 epochs total Iteration 0, loss = 0.0344 Iteration 20, loss = 0.0280 Iteration 40, loss = 0.0215 Iteration 60, loss = 0.0270 Iteration 80, loss = 0.0566 --- Epoch 29 / 50 - 29 epochs total Iteration 0, loss = 0.0398 Iteration 20, loss = 0.0439 Iteration 40, loss = 0.0233 Iteration 60, loss = 0.0339 Iteration 80, loss = 0.0299 --- Epoch 30 / 50 - 30 epochs total Iteration 0, loss = 0.0281 Iteration 20, loss = 0.0432 Iteration 40, loss = 0.0421 Iteration 60, loss = 0.0353 Iteration 80, loss = 0.0378 --- Epoch 31 / 50 - 31 epochs total Iteration 0, loss = 0.0339 Iteration 20, loss = 0.0268 Iteration 40, loss = 0.0414 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0343 --- Epoch 32 / 50 - 32 epochs total Iteration 0, loss = 0.0312 Iteration 20, loss = 0.0274 Iteration 40, loss = 0.0481 Iteration 60, loss = 0.0209 Iteration 80, loss = 0.0338 --- Epoch 33 / 50 - 33 epochs total Iteration 0, loss = 0.0281 Iteration 20, loss = 0.0562 Iteration 40, loss = 0.0288 Iteration 60, loss = 0.0451 Iteration 80, loss = 0.0420 --- Epoch 34 / 50 - 34 epochs total Iteration 0, loss = 0.0306 Iteration 20, loss = 0.0394 Iteration 40, loss = 0.0407 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0593 --- Epoch 35 / 50 - 35 epochs total Iteration 0, loss = 0.0292 
Iteration 20, loss = 0.0303 Iteration 40, loss = 0.0340 Iteration 60, loss = 0.0511 Iteration 80, loss = 0.0219 --- Epoch 36 / 50 - 36 epochs total Iteration 0, loss = 0.0402 Iteration 20, loss = 0.0206 Iteration 40, loss = 0.0390 Iteration 60, loss = 0.0335 Iteration 80, loss = 0.0423 --- Epoch 37 / 50 - 37 epochs total Iteration 0, loss = 0.0245 Iteration 20, loss = 0.0332 Iteration 40, loss = 0.0388 Iteration 60, loss = 0.0289 Iteration 80, loss = 0.0292 --- Epoch 38 / 50 - 38 epochs total Iteration 0, loss = 0.0372 Iteration 20, loss = 0.0211 Iteration 40, loss = 0.0418 Iteration 60, loss = 0.0306 Iteration 80, loss = 0.0417 --- Epoch 39 / 50 - 39 epochs total Iteration 0, loss = 0.0335 Iteration 20, loss = 0.1187 Iteration 40, loss = 0.0342 Iteration 60, loss = 0.0413 Iteration 80, loss = 0.0367 --- Epoch 40 / 50 - 40 epochs total Iteration 0, loss = 0.0327 Iteration 20, loss = 0.0363 Iteration 40, loss = 0.0793 Iteration 60, loss = 0.0334 Iteration 80, loss = 0.0324 --- Epoch 41 / 50 - 41 epochs total Iteration 0, loss = 0.0254 Iteration 20, loss = 0.0336 Iteration 40, loss = 0.0627 Iteration 60, loss = 0.0296 Iteration 80, loss = 0.0430 --- Epoch 42 / 50 - 42 epochs total Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0271 Iteration 40, loss = 0.0326 Iteration 60, loss = 0.0313 Iteration 80, loss = 0.0233 --- Epoch 43 / 50 - 43 epochs total Iteration 0, loss = 0.0271 Iteration 20, loss = 0.0390 Iteration 40, loss = 0.0335 Iteration 60, loss = 0.0272 Iteration 80, loss = 0.0192 --- Epoch 44 / 50 - 44 epochs total Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0490 Iteration 40, loss = 0.0306 Iteration 60, loss = 0.0333 Iteration 80, loss = 0.0384 --- Epoch 45 / 50 - 45 epochs total Iteration 0, loss = 0.0321 Iteration 20, loss = 0.0427 Iteration 40, loss = 0.0443 Iteration 60, loss = 0.0243 Iteration 80, loss = 0.0163 --- Epoch 46 / 50 - 46 epochs total Iteration 0, loss = 0.0286 Iteration 20, loss = 0.0669 Iteration 40, loss = 0.0432 Iteration 60, loss 
= 0.0391 Iteration 80, loss = 0.0431 --- Epoch 47 / 50 - 47 epochs total Iteration 0, loss = 0.0348 Iteration 20, loss = 0.0540 Iteration 40, loss = 0.0531 Iteration 60, loss = 0.0498 Iteration 80, loss = 0.0196 --- Epoch 48 / 50 - 48 epochs total Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0553 Iteration 60, loss = 0.0299 Iteration 80, loss = 0.0244 --- Epoch 49 / 50 - 49 epochs total Iteration 0, loss = 0.0242 Iteration 20, loss = 0.0572 Iteration 40, loss = 0.0327 Iteration 60, loss = 0.0355 Iteration 80, loss = 0.0435 --- Epoch 50 / 50 - 50 epochs total Iteration 0, loss = 0.0332 Iteration 20, loss = 0.0262 Iteration 40, loss = 0.0292 Iteration 60, loss = 0.0533 Iteration 80, loss = 0.0221
# Visualize predictions of the ConvNet trained with MSE on random test images.
testModel(model3)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
def detectEdges(image):
    """
    Return a binary edge map for a (C, rows, cols) float image tensor.

    Channel 0 of image is convolved (zero padded) with the 3x3 kernel that
    has 8 in the centre and -1 in the eight surrounding cells. Responses
    above 0.15 become 1 and everything else becomes 0. The same map is
    written to every channel of the result, which has the shape of image and
    is allocated with torch.zeros (default dtype and device).

    NOTE: only channel 0 is inspected; for an RGB tensor that is the red
    plane, not a luminance mix.
    NOTE: every entry of the result is overwritten by the constant 0 or 1,
    so no useful gradient reaches image through this function.
    """
    # Build the kernel to match the input instead of relying on module-level
    # device/dtype settings.
    kernel = torch.tensor(
        [[-1, -1, -1], [-1, 8, -1], [-1, -1, -1]],
        device=image.device,
        dtype=image.dtype,
    ).view(1, 1, 3, 3)

    # conv2d expects (batch, channels, rows, cols); the spatial size is read
    # from the input rather than fixed at 32x32.
    height, width = image.shape[-2:]
    first_channel = image[0].reshape(1, 1, height, width)
    edges = F.conv2d(first_channel, kernel, padding=1)[0, 0]

    ret = torch.zeros(image.shape)
    ret[:] = edges  # broadcast the single map across all channels

    # "<=" makes a response of exactly 0.15 binary as well.
    ret[ret <= 0.15] = 0
    ret[ret > 0.15] = 1
    return ret
Test edge detection
# Preview detectEdges on n random test images: input, edge map of the target, target.
n = 10
idx = np.random.choice(range(data["X_test"].shape[0]), n)

fig, axs = plt.subplots(n, 3)
fig.set_size_inches(10, 25)

# Set axis titles
for column, title in enumerate(('X data', 'Edges', 'Actual')):
    axs[0, column].title.set_text(title)

for i, sample in enumerate(idx):
    x_data = data["X_test"][sample]
    y_data = data["y_test"][sample]
    y_tensor = torch.from_numpy(y_data).to(device=device, dtype=dtype)
    edge_image = detectEdges(y_tensor).detach().numpy().transpose(1, 2, 0)
    # imshow wants channels last, hence the (1, 2, 0) transposes.
    axs[i, 0].imshow(x_data.transpose(1, 2, 0))
    axs[i, 1].imshow(edge_image)
    axs[i, 2].imshow(y_data.transpose(1, 2, 0))
Build custom loss functions that use adjacent-pixel differences to smooth the results and edge detection to preserve image structure. (The edge-detection loss didn't work well in any of my tests, so it is not widely used later on.)
def custom_loss(output, target):
    """
    Mean squared error combined with a smoothness penalty on the prediction.

    Both arguments are viewed as (3, 32, 32) images (channels, rows,
    columns - the layout the notebook transposes to channels-last for
    imshow). The result is

        0.8 * MSE(output, target)
        + 0.1 * mean squared difference of horizontally adjacent pixels
        + 0.1 * mean squared difference of vertically adjacent pixels

    where both smoothness terms are computed on output only.

    Inputs:
    - output: predicted image, any tensor with 3 * 32 * 32 elements.
    - target: ground-truth image with the same number of elements.

    Returns: scalar loss tensor.
    """
    output = output.view(3, 32, 32)
    target = target.view(3, 32, 32)

    # Overall mean squared error
    color_loss = torch.mean((output - target) ** 2)

    # Take difference between adjacent pixels into account to smoothen results.
    # Differences are taken along the two spatial axes (2 = columns, 1 = rows);
    # axis 0 is the colour channel and must not be differenced, otherwise the
    # loss penalises colour itself.
    horizontal_loss = torch.mean((output[:, :, 1:] - output[:, :, :-1]) ** 2)
    vertical_loss = torch.mean((output[:, 1:, :] - output[:, :-1, :]) ** 2)

    # Weights sum to 1, matching custom_loss_edges (the former 0.11 looked like a typo).
    loss = color_loss * 0.8 + horizontal_loss * 0.1 + vertical_loss * 0.1
    return loss
def custom_loss_edges(output, target):
    """
    MSE plus smoothness penalty plus a term comparing detectEdges maps.

    Both arguments are viewed as (3, 32, 32) images (channels, rows,
    columns). The result is

        0.6 * MSE(output, target)
        + 0.1 * mean squared difference of horizontally adjacent pixels
        + 0.1 * mean squared difference of vertically adjacent pixels
        + 0.2 * MSE(detectEdges(output), detectEdges(target))

    where both smoothness terms are computed on output only.

    Inputs:
    - output: predicted image, any tensor with 3 * 32 * 32 elements.
    - target: ground-truth image with the same number of elements.

    Returns: scalar loss tensor.
    """
    output = output.view(3, 32, 32)
    target = target.view(3, 32, 32)

    # Structural term: compare the edge maps of prediction and target.
    output_edges = detectEdges(output)
    target_edges = detectEdges(target)
    edge_loss = torch.mean((output_edges - target_edges) ** 2)

    # Overall mean squared error
    color_loss = torch.mean((output - target) ** 2)

    # Differences are taken along the two spatial axes (2 = columns, 1 = rows);
    # axis 0 is the colour channel and must not be differenced, otherwise the
    # loss penalises colour itself.
    horizontal_loss = torch.mean((output[:, :, 1:] - output[:, :, :-1]) ** 2)
    vertical_loss = torch.mean((output[:, 1:, :] - output[:, :-1, :]) ** 2)

    loss = color_loss * 0.6 + horizontal_loss * 0.1 + vertical_loss * 0.1 + edge_loss * 0.2
    return loss
# Train a fresh ConvNet for 300 epochs using custom_loss (MSE plus adjacent-difference terms).
learning_rate = 1e-2
model4 = ConvNet()
optimizer = optim.SGD(model4.parameters(), lr=learning_rate)
train(model4, optimizer, epochs=300, criterion=custom_loss)
--- Epoch 1 / 300 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0125 Iteration 80, loss = 0.0049 --- Epoch 2 / 300 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0119 --- Epoch 3 / 300 Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0149 --- Epoch 4 / 300 Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0162 --- Epoch 5 / 300 Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0195 Iteration 80, loss = 0.0104 --- Epoch 6 / 300 Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0251 Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0178 --- Epoch 7 / 300 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0073 --- Epoch 8 / 300 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0271 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0091 --- Epoch 9 / 300 Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0136 --- Epoch 10 / 300 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0070 --- Epoch 11 / 300 Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0216 --- Epoch 12 / 300 Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0098 --- Epoch 13 / 300 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0167 Iteration 
60, loss = 0.0199 Iteration 80, loss = 0.0089 --- Epoch 14 / 300 Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0260 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0170 --- Epoch 15 / 300 Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0269 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0063 --- Epoch 16 / 300 Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0156 --- Epoch 17 / 300 Iteration 0, loss = 0.0252 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0183 Iteration 80, loss = 0.0112 --- Epoch 18 / 300 Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0152 --- Epoch 19 / 300 Iteration 0, loss = 0.0294 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0097 --- Epoch 20 / 300 Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0203 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0178 --- Epoch 21 / 300 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0061 --- Epoch 22 / 300 Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0222 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0090 --- Epoch 23 / 300 Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0164 --- Epoch 24 / 300 Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0144 --- Epoch 25 / 300 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0402 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0100 --- Epoch 26 / 300 Iteration 0, loss = 0.0188 Iteration 
20, loss = 0.0077 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0146 --- Epoch 27 / 300 Iteration 0, loss = 0.0237 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0120 --- Epoch 28 / 300 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0250 --- Epoch 29 / 300 Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0130 --- Epoch 30 / 300 Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0108 Iteration 80, loss = 0.0059 --- Epoch 31 / 300 Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0145 --- Epoch 32 / 300 Iteration 0, loss = 0.0354 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0216 Iteration 80, loss = 0.0199 --- Epoch 33 / 300 Iteration 0, loss = 0.0212 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0138 --- Epoch 34 / 300 Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0182 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0172 --- Epoch 35 / 300 Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0421 --- Epoch 36 / 300 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0147 --- Epoch 37 / 300 Iteration 0, loss = 0.0250 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0691 Iteration 60, loss = 0.0144 Iteration 80, loss = 0.0110 --- Epoch 38 / 300 Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0209 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0112 
--- Epoch 39 / 300 Iteration 0, loss = 0.0185 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0316 Iteration 80, loss = 0.0193 --- Epoch 40 / 300 Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0086 --- Epoch 41 / 300 Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0096 --- Epoch 42 / 300 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0130 --- Epoch 43 / 300 Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0216 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0194 --- Epoch 44 / 300 Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0202 --- Epoch 45 / 300 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0105 --- Epoch 46 / 300 Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0149 --- Epoch 47 / 300 Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0157 Iteration 40, loss = 0.0254 Iteration 60, loss = 0.0229 Iteration 80, loss = 0.0160 --- Epoch 48 / 300 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0170 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0102 --- Epoch 49 / 300 Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0180 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0071 --- Epoch 50 / 300 Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0131 --- Epoch 51 / 300 Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0093 
Iteration 60, loss = 0.0188 Iteration 80, loss = 0.0120 --- Epoch 52 / 300 Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0187 Iteration 80, loss = 0.0241 --- Epoch 53 / 300 Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0259 Iteration 40, loss = 0.0297 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0121 --- Epoch 54 / 300 Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0102 --- Epoch 55 / 300 Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0293 --- Epoch 56 / 300 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0176 --- Epoch 57 / 300 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0188 Iteration 80, loss = 0.0059 --- Epoch 58 / 300 Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0094 --- Epoch 59 / 300 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0166 --- Epoch 60 / 300 Iteration 0, loss = 0.0217 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0113 --- Epoch 61 / 300 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0221 Iteration 40, loss = 0.0214 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0072 --- Epoch 62 / 300 Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0184 --- Epoch 63 / 300 Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0212 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0123 --- Epoch 64 / 300 Iteration 0, loss = 0.0105 
Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0093 --- Epoch 65 / 300 Iteration 0, loss = 0.0157 Iteration 20, loss = 0.0213 Iteration 40, loss = 0.0199 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0090 --- Epoch 66 / 300 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0212 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0039 --- Epoch 67 / 300 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0204 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0134 --- Epoch 68 / 300 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0212 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0088 --- Epoch 69 / 300 Iteration 0, loss = 0.0314 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0103 --- Epoch 70 / 300 Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0084 --- Epoch 71 / 300 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0125 --- Epoch 72 / 300 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0223 Iteration 60, loss = 0.0227 Iteration 80, loss = 0.0034 --- Epoch 73 / 300 Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0091 --- Epoch 74 / 300 Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0264 --- Epoch 75 / 300 Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0144 --- Epoch 76 / 300 Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0196 Iteration 40, loss = 0.0223 Iteration 60, loss = 0.0211 Iteration 80, loss 
= 0.0163 --- Epoch 77 / 300 Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0268 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0112
--------------------------------------------------------------------------- KeyboardInterrupt Traceback (most recent call last) <ipython-input-452-13970f5e6e2d> in <module> ----> 1 train(model4, optimizer, epochs=300, criterion=custom_loss) <ipython-input-5-6d69c0665347> in train(model, optimizer, epochs, criterion) 34 # Zero out all of the gradients for the variables which the optimizer 35 # will update. ---> 36 optimizer.zero_grad() 37 38 # This is the backwards pass: compute the gradient of the loss with KeyboardInterrupt:
# Run the notebook's testModel helper on model4. The training run above was
# stopped by hand (KeyboardInterrupt during epoch 77 of 300), so this looks at
# the partially trained weights.
# NOTE(review): testModel is defined outside this section; the recorded output
# consists of matplotlib imshow clipping warnings, so it presumably plots RGB
# predictions - confirm against its definition.
testModel(model4)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
# Build a fresh ConvNet and optimise it with plain SGD (no momentum or weight
# decay is configured here), using custom_loss_edges as the training criterion.
model5 = ConvNet()
learning_rate = 1e-2
optimizer = optim.SGD(params=model5.parameters(), lr=learning_rate)
train(model5, optimizer, epochs=300, criterion=custom_loss_edges)
--- Epoch 1 / 300 Iteration 0, loss = 0.1264 Iteration 20, loss = 0.0959 Iteration 40, loss = 0.0950 Iteration 60, loss = 0.1142 Iteration 80, loss = 0.1146 --- Epoch 2 / 300 Iteration 0, loss = 0.1114 Iteration 20, loss = 0.0938 Iteration 40, loss = 0.0967 Iteration 60, loss = 0.1293 Iteration 80, loss = 0.1029 --- Epoch 3 / 300 Iteration 0, loss = 0.1161 Iteration 20, loss = 0.1257 Iteration 40, loss = 0.1162 Iteration 60, loss = 0.1176 Iteration 80, loss = 0.0968 --- Epoch 4 / 300 Iteration 0, loss = 0.0887 Iteration 20, loss = 0.1108 Iteration 40, loss = 0.0977 Iteration 60, loss = 0.1076 Iteration 80, loss = 0.0902 --- Epoch 5 / 300 Iteration 0, loss = 0.1177 Iteration 20, loss = 0.0982 Iteration 40, loss = 0.0957 Iteration 60, loss = 0.1109 Iteration 80, loss = 0.1038 --- Epoch 6 / 300 Iteration 0, loss = 0.0996 Iteration 20, loss = 0.0890 Iteration 40, loss = 0.1083 Iteration 60, loss = 0.1139 Iteration 80, loss = 0.1148 --- Epoch 7 / 300 Iteration 0, loss = 0.1036 Iteration 20, loss = 0.1009 Iteration 40, loss = 0.0886 Iteration 60, loss = 0.0989 Iteration 80, loss = 0.1176 --- Epoch 8 / 300 Iteration 0, loss = 0.0981 Iteration 20, loss = 0.1265 Iteration 40, loss = 0.1045 Iteration 60, loss = 0.1128 Iteration 80, loss = 0.0987 --- Epoch 9 / 300 Iteration 0, loss = 0.0919 Iteration 20, loss = 0.1085 Iteration 40, loss = 0.1061 Iteration 60, loss = 0.1128 Iteration 80, loss = 0.1039 --- Epoch 10 / 300 Iteration 0, loss = 0.1030 Iteration 20, loss = 0.0932 Iteration 40, loss = 0.1131 Iteration 60, loss = 0.1318 Iteration 80, loss = 0.1277 --- Epoch 11 / 300 Iteration 0, loss = 0.1366 Iteration 20, loss = 0.1155 Iteration 40, loss = 0.1211 Iteration 60, loss = 0.0946 Iteration 80, loss = 0.1204 --- Epoch 12 / 300 Iteration 0, loss = 0.1139 Iteration 20, loss = 0.0945 Iteration 40, loss = 0.0955 Iteration 60, loss = 0.1091 Iteration 80, loss = 0.0902 --- Epoch 13 / 300 Iteration 0, loss = 0.1126 Iteration 20, loss = 0.0948 Iteration 40, loss = 0.0972 Iteration 
60, loss = 0.0968 Iteration 80, loss = 0.1454 --- Epoch 14 / 300 Iteration 0, loss = 0.1354 Iteration 20, loss = 0.1142 Iteration 40, loss = 0.0934 Iteration 60, loss = 0.1096 Iteration 80, loss = 0.0959
--------------------------------------------------------------------------- KeyboardInterrupt Traceback (most recent call last) <ipython-input-72-157c50dede99> in <module> ----> 1 train(model5, optimizer, epochs=300, criterion=custom_loss_edges) <ipython-input-6-6d69c0665347> in train(model, optimizer, epochs, criterion) 34 # Zero out all of the gradients for the variables which the optimizer 35 # will update. ---> 36 optimizer.zero_grad() 37 38 # This is the backwards pass: compute the gradient of the loss with /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/optim/optimizer.py in zero_grad(self) 170 if p.grad is not None: 171 p.grad.detach_() --> 172 p.grad.zero_() 173 174 def step(self, closure): KeyboardInterrupt:
# Run the notebook's testModel helper on model5. The training run above was
# interrupted by hand during epoch 14 of 300, so these are early weights.
# NOTE(review): testModel is defined outside this section; the recorded output
# is a series of imshow clipping warnings, so it presumably plots RGB
# predictions - confirm against its definition.
testModel(model5)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
class ConvNet2(nn.Module):
    """Four convolution stages followed by one dense read-out layer.

    The network processes ONE image per call: ``forward`` adds the batch
    dimension itself.  The flattened output of the last convolution stage is
    concatenated with the flattened input image before the fully connected
    layer, so the dense layer sees both the learned features and the raw
    pixel values.

    The dense layer's input width is hard-wired for a 3 x 32 x 32 input:
    the convolutions shrink 32 -> 31 -> 30 -> 29 -> 29 pixels per side,
    giving 12 * 29 * 29 feature values plus 3 * 32 * 32 input values.
    """

    def __init__(self):
        super().__init__()
        # Initialised to zero; nothing inside this class updates it.
        self.epochsTrained = 0

        # The normalisation layers are registered before the convolutions so
        # that the ordering of parameters() / state_dict() stays as it was.
        self.batchnorm1 = nn.BatchNorm2d(num_features=24)
        self.batchnorm2 = nn.BatchNorm2d(num_features=24)
        self.batchnorm3 = nn.BatchNorm2d(num_features=12)
        self.batchnorm4 = nn.BatchNorm2d(num_features=12)

        # 24 filters of 6x6: 32x32 -> 31x31
        self.conv1 = nn.Conv2d(in_channels=3, out_channels=24,
                               kernel_size=6, stride=1, padding=2)
        # 24 filters of 4x4: 31x31 -> 30x30
        self.conv2 = nn.Conv2d(in_channels=24, out_channels=24,
                               kernel_size=4, stride=1, padding=1)
        # 12 filters of 4x4: 30x30 -> 29x29
        self.conv3 = nn.Conv2d(in_channels=24, out_channels=12,
                               kernel_size=4, stride=1, padding=1)
        # 12 filters of 3x3: 29x29 -> 29x29
        self.conv4 = nn.Conv2d(in_channels=12, out_channels=12,
                               kernel_size=3, stride=1, padding=1)

        conv_values = 12 * 29 * 29    # flattened output of the last stage
        image_values = 3 * 32 * 32    # flattened input image
        # 10092 + 3072 = 13164 inputs, one output per input-image value.
        self.fc = nn.Linear(conv_values + image_values, image_values)

    def forward(self, x):
        """Map a single image tensor to a flat vector of 32 * 32 * 3 scores.

        ``x`` is unsqueezed to a batch of one, passed through the four
        convolution stages, and the result is flattened, joined with the
        flattened ``x`` and fed to the dense layer.
        """
        hidden = x.unsqueeze(0)

        # The first three stages share the same shape: conv -> ReLU -> batch norm.
        relu_stages = (
            (self.conv1, self.batchnorm1),
            (self.conv2, self.batchnorm2),
            (self.conv3, self.batchnorm3),
        )
        for conv, norm in relu_stages:
            hidden = norm(F.relu(conv(hidden)))

        # The last stage uses tanh instead of ReLU before normalising.
        hidden = self.batchnorm4(torch.tanh(self.conv4(hidden)))

        # Skip connection: append the raw input values to the conv features.
        features = torch.cat([hidden.view(-1), x.view(-1)], dim=0)
        return self.fc(features)
# Build a fresh ConvNet2 and optimise it with plain SGD (no momentum or weight
# decay is configured here), using custom_loss as the training criterion.
model6 = ConvNet2()
learning_rate = 1e-2
optimizer = optim.SGD(params=model6.parameters(), lr=learning_rate)
train(model6, optimizer, epochs=250, criterion=custom_loss)
--- Epoch 1 / 250 Iteration 0, loss = 0.1323 Iteration 20, loss = 0.1473 Iteration 40, loss = 0.1414 Iteration 60, loss = 0.1272 Iteration 80, loss = 0.1903 --- Epoch 2 / 250 Iteration 0, loss = 0.0930 Iteration 20, loss = 0.0972 Iteration 40, loss = 0.1379 Iteration 60, loss = 0.0825 Iteration 80, loss = 0.1351 --- Epoch 3 / 250 Iteration 0, loss = 0.1339 Iteration 20, loss = 0.1859 Iteration 40, loss = 0.1257 Iteration 60, loss = 0.1184 Iteration 80, loss = 0.0991 --- Epoch 4 / 250 Iteration 0, loss = 0.1137 Iteration 20, loss = 0.0941 Iteration 40, loss = 0.1762 Iteration 60, loss = 0.1596 Iteration 80, loss = 0.1572 --- Epoch 5 / 250 Iteration 0, loss = 0.1331 Iteration 20, loss = 0.1142 Iteration 40, loss = 0.1244 Iteration 60, loss = 0.1387 Iteration 80, loss = 0.1038 --- Epoch 6 / 250 Iteration 0, loss = 0.0847 Iteration 20, loss = 0.1252 Iteration 40, loss = 0.1097 Iteration 60, loss = 0.1029 Iteration 80, loss = 0.1377 --- Epoch 7 / 250 Iteration 0, loss = 0.1077 Iteration 20, loss = 0.1487 Iteration 40, loss = 0.0997 Iteration 60, loss = 0.1337 Iteration 80, loss = 0.1576 --- Epoch 8 / 250 Iteration 0, loss = 0.1305 Iteration 20, loss = 0.1682 Iteration 40, loss = 0.1038 Iteration 60, loss = 0.1402 Iteration 80, loss = 0.1207 --- Epoch 9 / 250 Iteration 0, loss = 0.0850 Iteration 20, loss = 0.1723 Iteration 40, loss = 0.1478 Iteration 60, loss = 0.1355 Iteration 80, loss = 0.0900 --- Epoch 10 / 250 Iteration 0, loss = 0.0949 Iteration 20, loss = 0.1598 Iteration 40, loss = 0.1249 Iteration 60, loss = 0.0941 Iteration 80, loss = 0.1503 --- Epoch 11 / 250 Iteration 0, loss = 0.0915 Iteration 20, loss = 0.1141 Iteration 40, loss = 0.1179 Iteration 60, loss = 0.0786 Iteration 80, loss = 0.1332 --- Epoch 12 / 250 Iteration 0, loss = 0.1909 Iteration 20, loss = 0.1306
--------------------------------------------------------------------------- KeyboardInterrupt Traceback (most recent call last) <ipython-input-128-1446adb45ff8> in <module> ----> 1 train(model6, optimizer, epochs=250, criterion=custom_loss) <ipython-input-6-6d69c0665347> in train(model, optimizer, epochs, criterion) 38 # This is the backwards pass: compute the gradient of the loss with 39 # respect to each parameter of the model. ---> 40 loss.backward() 41 42 # Actually update the parameters of the model using the gradients /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/tensor.py in backward(self, gradient, retain_graph, create_graph) 183 products. Defaults to ``False``. 184 """ --> 185 torch.autograd.backward(self, gradient, retain_graph, create_graph) 186 187 def register_hook(self, hook): /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/autograd/__init__.py in backward(tensors, grad_tensors, retain_graph, create_graph, grad_variables) 125 Variable._execution_engine.run_backward( 126 tensors, grad_tensors, retain_graph, create_graph, --> 127 allow_unreachable=True) # allow_unreachable flag 128 129 KeyboardInterrupt:
# Evaluate model6, the ConvNet2 trained in the preceding cell. Testing model5
# here would only repeat the earlier evaluation and leave model6 unchecked.
testModel(model6)
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
Try training on a single class of images to make the task easier for the network
# Build per-class subsets of every split so a model can be trained on one
# object category at a time.  For each class name the colour images become the
# targets ("y_<split>_<name>") and their grayscale versions the inputs
# ("X_<split>_<name>").
# Assumes integer label i in y_train / y_val / y_test corresponds to
# classes[i] (the standard CIFAR-10 ordering) - TODO confirm against the loader.
classes = ["airplane", "automobile", "bird", "cat", "deer",
           "dog", "frog", "horse", "ship", "truck"]
splits = ("train", "val", "test")

for c, cname in enumerate(classes):
    # Select the colour images of class c once per split; the boolean mask
    # picks the same rows, in the same order, as indexing with np.where(...).
    colored = {
        split: unproccessed_data["X_" + split][unproccessed_data["y_" + split] == c]
        for split in splits
    }

    # Targets first, then inputs, so keys are inserted into `data` in the same
    # order as before (y_train, y_val, y_test, X_train, X_val, X_test).
    for split in splits:
        data["y_" + split + "_" + cname] = colored[split]
    for split in splits:
        # convertToBW builds a new array, so the stored colour target is untouched.
        data["X_" + split + "_" + cname] = convertToBW(colored[split])
dict_keys(['y_train', 'y_val', 'y_test', 'X_train', 'X_val', 'X_test', 'y_train_airplane', 'y_val_airplane', 'y_test_airplane', 'X_train_airplane', 'X_val_airplane', 'X_test_airplane', 'y_train_automobile', 'y_val_automobile', 'y_test_automobile', 'X_train_automobile', 'X_val_automobile', 'X_test_automobile', 'y_train_bird', 'y_val_bird', 'y_test_bird', 'X_train_bird', 'X_val_bird', 'X_test_bird', 'y_train_cat', 'y_val_cat', 'y_test_cat', 'X_train_cat', 'X_val_cat', 'X_test_cat', 'y_train_deer', 'y_val_deer', 'y_test_deer', 'X_train_deer', 'X_val_deer', 'X_test_deer', 'y_train_dog', 'y_val_dog', 'y_test_dog', 'X_train_dog', 'X_val_dog', 'X_test_dog', 'y_train_frog', 'y_val_frog', 'y_test_frog', 'X_train_frog', 'X_val_frog', 'X_test_frog', 'y_train_horse', 'y_val_horse', 'y_test_horse', 'X_train_horse', 'X_val_horse', 'X_test_horse', 'y_train_ship', 'y_val_ship', 'y_test_ship', 'X_train_ship', 'X_val_ship', 'X_test_ship', 'y_train_truck', 'y_val_truck', 'y_test_truck', 'X_train_truck', 'X_val_truck', 'X_test_truck'])
# Train a ConvNet2 on the images of a single class.
# The per-class loop above stores its subsets under "X_train_<name>" and
# "y_train_<name>"; no literal "X_train_class" key is ever created, so looking
# it up raises KeyError on a clean top-to-bottom run.  Pick the class explicitly.
target_class = "airplane"  # any entry of `classes` can be used here

learning_rate = 5e-3
model7 = ConvNet2()
optimizer = optim.SGD(model7.parameters(), lr=learning_rate)
train(
    model7,
    optimizer,
    epochs=1000,
    x_train=data["X_train_" + target_class],
    y_train=data["y_train_" + target_class],
    criterion=custom_loss,
)
--- Epoch 1 / 1000 Iteration 0, loss = 0.5163 Iteration 20, loss = 0.4907 Iteration 40, loss = 0.3813 Iteration 60, loss = 0.2225 Iteration 80, loss = 0.2141 --- Epoch 2 / 1000 Iteration 0, loss = 0.1437 Iteration 20, loss = 0.1209 Iteration 40, loss = 0.1181 Iteration 60, loss = 0.1140 Iteration 80, loss = 0.1295 --- Epoch 3 / 1000 Iteration 0, loss = 0.1044 Iteration 20, loss = 0.0945 Iteration 40, loss = 0.0883 Iteration 60, loss = 0.0771 Iteration 80, loss = 0.1358 --- Epoch 4 / 1000 Iteration 0, loss = 0.0540 Iteration 20, loss = 0.0467 Iteration 40, loss = 0.0336 Iteration 60, loss = 0.0385 Iteration 80, loss = 0.0180 --- Epoch 5 / 1000 Iteration 0, loss = 0.0517 Iteration 20, loss = 0.0614 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0386 Iteration 80, loss = 0.2632 --- Epoch 6 / 1000 Iteration 0, loss = 0.0245 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.1029 Iteration 60, loss = 0.0547 Iteration 80, loss = 0.0560 --- Epoch 7 / 1000 Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0323 Iteration 40, loss = 0.0297 Iteration 60, loss = 0.0215 Iteration 80, loss = 0.0278 --- Epoch 8 / 1000 Iteration 0, loss = 0.0288 Iteration 20, loss = 0.0433 Iteration 40, loss = 0.0269 Iteration 60, loss = 0.0411 Iteration 80, loss = 0.0266 --- Epoch 9 / 1000 Iteration 0, loss = 0.0520 Iteration 20, loss = 0.0614 Iteration 40, loss = 0.0220 Iteration 60, loss = 0.0699 Iteration 80, loss = 0.0410 --- Epoch 10 / 1000 Iteration 0, loss = 0.0454 Iteration 20, loss = 0.2740 Iteration 40, loss = 0.0621 Iteration 60, loss = 0.0261 Iteration 80, loss = 0.0162 --- Epoch 11 / 1000 Iteration 0, loss = 0.0524 Iteration 20, loss = 0.1356 Iteration 40, loss = 0.0476 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0620 --- Epoch 12 / 1000 Iteration 0, loss = 0.0308 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0632 Iteration 60, loss = 0.0402 Iteration 80, loss = 0.0662 --- Epoch 13 / 1000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.1502 Iteration 40, loss = 
0.0053 Iteration 60, loss = 0.0163 Iteration 80, loss = 0.0521 --- Epoch 14 / 1000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0221 Iteration 40, loss = 0.0472 Iteration 60, loss = 0.0219 Iteration 80, loss = 0.0227 --- Epoch 15 / 1000 Iteration 0, loss = 0.0262 Iteration 20, loss = 0.0331 Iteration 40, loss = 0.0581 Iteration 60, loss = 0.0273 Iteration 80, loss = 0.0097 --- Epoch 16 / 1000 Iteration 0, loss = 0.0416 Iteration 20, loss = 0.0209 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0391 Iteration 80, loss = 0.0136 --- Epoch 17 / 1000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0383 Iteration 40, loss = 0.0239 Iteration 60, loss = 0.0339 Iteration 80, loss = 0.0503 --- Epoch 18 / 1000 Iteration 0, loss = 0.0419 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0313 Iteration 80, loss = 0.0396 --- Epoch 19 / 1000 Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0398 Iteration 40, loss = 0.0220 Iteration 60, loss = 0.1211 Iteration 80, loss = 0.0583 --- Epoch 20 / 1000 Iteration 0, loss = 0.0395 Iteration 20, loss = 0.0629 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0304 --- Epoch 21 / 1000 Iteration 0, loss = 0.0188 Iteration 20, loss = 0.0313 Iteration 40, loss = 0.0239 Iteration 60, loss = 0.0747 Iteration 80, loss = 0.0119 --- Epoch 22 / 1000 Iteration 0, loss = 0.0401 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0185 --- Epoch 23 / 1000 Iteration 0, loss = 0.0225 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0240 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0425 --- Epoch 24 / 1000 Iteration 0, loss = 0.0215 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0301 Iteration 60, loss = 0.0595 Iteration 80, loss = 0.0138 --- Epoch 25 / 1000 Iteration 0, loss = 0.0402 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0263 Iteration 60, loss = 0.0313 Iteration 80, loss = 0.0091 --- Epoch 26 / 1000 
Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0317 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0406 --- Epoch 27 / 1000 Iteration 0, loss = 0.0377 Iteration 20, loss = 0.0367 Iteration 40, loss = 0.0697 Iteration 60, loss = 0.0375 Iteration 80, loss = 0.0241 --- Epoch 28 / 1000 Iteration 0, loss = 0.0295 Iteration 20, loss = 0.0183 Iteration 40, loss = 0.0169 Iteration 60, loss = 0.0361 Iteration 80, loss = 0.0107 --- Epoch 29 / 1000 Iteration 0, loss = 0.0550 Iteration 20, loss = 0.0414 Iteration 40, loss = 0.0296 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0166 --- Epoch 30 / 1000 Iteration 0, loss = 0.0230 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0400 Iteration 60, loss = 0.0717 Iteration 80, loss = 0.0482 --- Epoch 31 / 1000 Iteration 0, loss = 0.0391 Iteration 20, loss = 0.0224 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0201 Iteration 80, loss = 0.0165 --- Epoch 32 / 1000 Iteration 0, loss = 0.0379 Iteration 20, loss = 0.0352 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0624 Iteration 80, loss = 0.0251 --- Epoch 33 / 1000 Iteration 0, loss = 0.0240 Iteration 20, loss = 0.0300 Iteration 40, loss = 0.0416 Iteration 60, loss = 0.0236 Iteration 80, loss = 0.0365 --- Epoch 34 / 1000 Iteration 0, loss = 0.0231 Iteration 20, loss = 0.0346 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0182 --- Epoch 35 / 1000 Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0253 Iteration 60, loss = 0.0188 Iteration 80, loss = 0.0393 --- Epoch 36 / 1000 Iteration 0, loss = 0.0299 Iteration 20, loss = 0.0293 Iteration 40, loss = 0.0411 Iteration 60, loss = 0.0381 Iteration 80, loss = 0.0346 --- Epoch 37 / 1000 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0241 Iteration 40, loss = 0.0253 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0234 --- Epoch 38 / 1000 Iteration 0, loss = 0.0458 Iteration 20, loss = 0.0430 Iteration 40, loss = 0.0123 
Iteration 60, loss = 0.0342 Iteration 80, loss = 0.0122 --- Epoch 39 / 1000 Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0430 Iteration 40, loss = 0.0305 Iteration 60, loss = 0.0245 Iteration 80, loss = 0.0105 --- Epoch 40 / 1000 Iteration 0, loss = 0.0285 Iteration 20, loss = 0.0288 Iteration 40, loss = 0.0351 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0182 --- Epoch 41 / 1000 Iteration 0, loss = 0.0215 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0369 Iteration 60, loss = 0.0319 Iteration 80, loss = 0.0225 --- Epoch 42 / 1000 Iteration 0, loss = 0.0176 Iteration 20, loss = 0.0278 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0450 Iteration 80, loss = 0.0220 --- Epoch 43 / 1000 Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0275 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0320 --- Epoch 44 / 1000 Iteration 0, loss = 0.0664 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0199 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0283 --- Epoch 45 / 1000 Iteration 0, loss = 0.0232 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0316 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0123 --- Epoch 46 / 1000 Iteration 0, loss = 0.0200 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0210 Iteration 60, loss = 0.0339 Iteration 80, loss = 0.0177 --- Epoch 47 / 1000 Iteration 0, loss = 0.0280 Iteration 20, loss = 0.0240 Iteration 40, loss = 0.0388 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0533 --- Epoch 48 / 1000 Iteration 0, loss = 0.0459 Iteration 20, loss = 0.0182 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0639 Iteration 80, loss = 0.0358 --- Epoch 49 / 1000 Iteration 0, loss = 0.0227 Iteration 20, loss = 0.0481 Iteration 40, loss = 0.0399 Iteration 60, loss = 0.0158 Iteration 80, loss = 0.0396 --- Epoch 50 / 1000 Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0265 Iteration 60, loss = 0.0308 Iteration 80, loss = 0.0324 --- Epoch 51 / 1000 Iteration 0, 
loss = 0.0276 Iteration 20, loss = 0.0343 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0221 Iteration 80, loss = 0.0337 --- Epoch 52 / 1000 Iteration 0, loss = 0.0360 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0221 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0352 --- Epoch 53 / 1000 Iteration 0, loss = 0.0365 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0211 Iteration 60, loss = 0.0462 Iteration 80, loss = 0.0185 --- Epoch 54 / 1000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0452 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0195 --- Epoch 55 / 1000 Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0251 Iteration 80, loss = 0.0262 --- Epoch 56 / 1000 Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0215 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0312 --- Epoch 57 / 1000 Iteration 0, loss = 0.0200 Iteration 20, loss = 0.0347 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0248 --- Epoch 58 / 1000 Iteration 0, loss = 0.0280 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0302 Iteration 80, loss = 0.0135 --- Epoch 59 / 1000 Iteration 0, loss = 0.0239 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0321 Iteration 80, loss = 0.0263 --- Epoch 60 / 1000 Iteration 0, loss = 0.0213 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0420 Iteration 60, loss = 0.0288 Iteration 80, loss = 0.0458 --- Epoch 61 / 1000 Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0264 Iteration 80, loss = 0.0568 --- Epoch 62 / 1000 Iteration 0, loss = 0.0481 Iteration 20, loss = 0.0230 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0302 --- Epoch 63 / 1000 Iteration 0, loss = 0.0271 Iteration 20, loss = 0.0217 Iteration 40, loss = 0.0120 Iteration 60, loss = 
0.0104 Iteration 80, loss = 0.0278 --- Epoch 64 / 1000 Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0439 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0288 Iteration 80, loss = 0.0240 --- Epoch 65 / 1000 Iteration 0, loss = 0.0308 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0070 --- Epoch 66 / 1000 Iteration 0, loss = 0.0419 Iteration 20, loss = 0.0496 Iteration 40, loss = 0.0151 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0146 --- Epoch 67 / 1000 Iteration 0, loss = 0.0520 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0399 Iteration 60, loss = 0.0223 Iteration 80, loss = 0.0188 --- Epoch 68 / 1000 Iteration 0, loss = 0.0240 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0268 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0098 --- Epoch 69 / 1000 Iteration 0, loss = 0.0826 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0347 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0188 --- Epoch 70 / 1000 Iteration 0, loss = 0.0217 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0173 Iteration 60, loss = 0.0216 Iteration 80, loss = 0.0166 --- Epoch 71 / 1000 Iteration 0, loss = 0.0323 Iteration 20, loss = 0.0216 Iteration 40, loss = 0.0229 Iteration 60, loss = 0.0577 Iteration 80, loss = 0.0388 --- Epoch 72 / 1000 Iteration 0, loss = 0.0289 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0230 Iteration 80, loss = 0.0085 --- Epoch 73 / 1000 Iteration 0, loss = 0.0295 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0258 Iteration 60, loss = 0.0294 Iteration 80, loss = 0.0128 --- Epoch 74 / 1000 Iteration 0, loss = 0.0415 Iteration 20, loss = 0.0526 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0283 Iteration 80, loss = 0.0200 --- Epoch 75 / 1000 Iteration 0, loss = 0.0234 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0276 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0158 --- Epoch 76 / 1000 Iteration 0, loss = 0.0402 Iteration 
20, loss = 0.0414 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0116 --- Epoch 77 / 1000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0352 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0284 Iteration 80, loss = 0.0333 --- Epoch 78 / 1000 Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0296 Iteration 40, loss = 0.0223 Iteration 60, loss = 0.0283 Iteration 80, loss = 0.0173 --- Epoch 79 / 1000 Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0282 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0223 Iteration 80, loss = 0.0111 --- Epoch 80 / 1000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0182 Iteration 40, loss = 0.0265 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0160 --- Epoch 81 / 1000 Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0244 Iteration 40, loss = 0.0366 Iteration 60, loss = 0.0275 Iteration 80, loss = 0.0168 --- Epoch 82 / 1000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0203 Iteration 80, loss = 0.0145 --- Epoch 83 / 1000 Iteration 0, loss = 0.0151 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0102 --- Epoch 84 / 1000 Iteration 0, loss = 0.0300 Iteration 20, loss = 0.0242 Iteration 40, loss = 0.0274 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0153 --- Epoch 85 / 1000 Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0521 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0279 --- Epoch 86 / 1000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0359 Iteration 60, loss = 0.0395 Iteration 80, loss = 0.0092 --- Epoch 87 / 1000 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0270 Iteration 80, loss = 0.0391 --- Epoch 88 / 1000 Iteration 0, loss = 0.0467 Iteration 20, loss = 0.0372 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0252 Iteration 80, 
loss = 0.0214 --- Epoch 89 / 1000 Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0370 Iteration 40, loss = 0.0712 Iteration 60, loss = 0.0447 Iteration 80, loss = 0.0260 --- Epoch 90 / 1000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0293 Iteration 40, loss = 0.0201 Iteration 60, loss = 0.0237 Iteration 80, loss = 0.0448 --- Epoch 91 / 1000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0285 Iteration 80, loss = 0.0148 --- Epoch 92 / 1000 Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0239 Iteration 40, loss = 0.0360 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0181 --- Epoch 93 / 1000 Iteration 0, loss = 0.0542 Iteration 20, loss = 0.0222 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0276 --- Epoch 94 / 1000 Iteration 0, loss = 0.0227 Iteration 20, loss = 0.0256 Iteration 40, loss = 0.0363 Iteration 60, loss = 0.0137 Iteration 80, loss = 0.0120 --- Epoch 95 / 1000 Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0690 Iteration 60, loss = 0.0734 Iteration 80, loss = 0.0271 --- Epoch 96 / 1000 Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0413 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0184 Iteration 80, loss = 0.0166 --- Epoch 97 / 1000 Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0305 Iteration 60, loss = 0.0197 Iteration 80, loss = 0.0320 --- Epoch 98 / 1000 Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0285 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0182 --- Epoch 99 / 1000 Iteration 0, loss = 0.0269 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0361 Iteration 60, loss = 0.0385 Iteration 80, loss = 0.0142 --- Epoch 100 / 1000 Iteration 0, loss = 0.0228 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0283 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0294 --- Epoch 101 / 1000 Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0224 
Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0183 --- Epoch 102 / 1000 Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0416 Iteration 40, loss = 0.0177 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0168 --- Epoch 103 / 1000 Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0267 --- Epoch 104 / 1000 Iteration 0, loss = 0.0382 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0181 --- Epoch 105 / 1000 Iteration 0, loss = 0.0194 Iteration 20, loss = 0.0241 Iteration 40, loss = 0.0272 Iteration 60, loss = 0.0337 Iteration 80, loss = 0.0334 --- Epoch 106 / 1000 Iteration 0, loss = 0.0300 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0927 --- Epoch 107 / 1000 Iteration 0, loss = 0.0250 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0352 Iteration 80, loss = 0.0198 --- Epoch 108 / 1000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0213 Iteration 40, loss = 0.0570 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0147 --- Epoch 109 / 1000 Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0420 Iteration 80, loss = 0.0142 --- Epoch 110 / 1000 Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0265 Iteration 40, loss = 0.0638 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0241 --- Epoch 111 / 1000 Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0307 Iteration 80, loss = 0.0338 --- Epoch 112 / 1000 Iteration 0, loss = 0.0356 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0212 Iteration 60, loss = 0.0354 Iteration 80, loss = 0.0288 --- Epoch 113 / 1000 Iteration 0, loss = 0.0254 Iteration 20, loss = 0.0233 Iteration 40, loss = 0.0313 Iteration 60, loss = 0.0150 Iteration 80, loss = 
0.0222 --- Epoch 114 / 1000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0222 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0261 --- Epoch 115 / 1000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0191 Iteration 80, loss = 0.0209 --- Epoch 116 / 1000 Iteration 0, loss = 0.0300 Iteration 20, loss = 0.0249 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0459 Iteration 80, loss = 0.0109 --- Epoch 117 / 1000 Iteration 0, loss = 0.0176 Iteration 20, loss = 0.0265 Iteration 40, loss = 0.0221 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0171 --- Epoch 118 / 1000 Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0378 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0188 --- Epoch 119 / 1000 Iteration 0, loss = 0.0280 Iteration 20, loss = 0.0366 Iteration 40, loss = 0.0196 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0177 --- Epoch 120 / 1000 Iteration 0, loss = 0.0197 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0167 Iteration 80, loss = 0.0121 --- Epoch 121 / 1000 Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0249 Iteration 80, loss = 0.0279 --- Epoch 122 / 1000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0218 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0264 --- Epoch 123 / 1000 Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0269 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0213 Iteration 80, loss = 0.0204 --- Epoch 124 / 1000 Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0193 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0142 --- Epoch 125 / 1000 Iteration 0, loss = 0.0294 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0283 Iteration 80, loss = 0.0144 --- Epoch 126 / 1000 Iteration 0, loss = 0.0079 Iteration 20, loss = 
0.0082 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0528 Iteration 80, loss = 0.0291 --- Epoch 127 / 1000 Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0282 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0141 --- Epoch 128 / 1000 Iteration 0, loss = 0.0223 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0251 --- Epoch 129 / 1000 Iteration 0, loss = 0.0214 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0159 Iteration 80, loss = 0.0223 --- Epoch 130 / 1000 Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0350 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0175 --- Epoch 131 / 1000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0340 Iteration 40, loss = 0.0373 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0313 --- Epoch 132 / 1000 Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0203 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0389 --- Epoch 133 / 1000 Iteration 0, loss = 0.0176 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0163 --- Epoch 134 / 1000 Iteration 0, loss = 0.0269 Iteration 20, loss = 0.0186 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0199 Iteration 80, loss = 0.0087 --- Epoch 135 / 1000 Iteration 0, loss = 0.0334 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0356 Iteration 80, loss = 0.0124 --- Epoch 136 / 1000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0254 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0106 --- Epoch 137 / 1000 Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0137 --- Epoch 138 / 1000 Iteration 0, loss = 0.0220 Iteration 20, loss = 0.0375 Iteration 40, loss = 0.0208 Iteration 60, loss = 0.0122 Iteration 80, 
loss = 0.0273 --- Epoch 139 / 1000 Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0300 Iteration 80, loss = 0.0175 --- Epoch 140 / 1000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0206 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0199 --- Epoch 141 / 1000 Iteration 0, loss = 0.0212 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0250 Iteration 80, loss = 0.0094 --- Epoch 142 / 1000 Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0643 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0276 Iteration 80, loss = 0.0137 --- Epoch 143 / 1000 Iteration 0, loss = 0.0249 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0224 Iteration 80, loss = 0.0120 --- Epoch 144 / 1000 Iteration 0, loss = 0.0217 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0207 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0059 --- Epoch 145 / 1000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0238 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0144 --- Epoch 146 / 1000 Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0379 Iteration 40, loss = 0.0216 Iteration 60, loss = 0.0226 Iteration 80, loss = 0.0591 --- Epoch 147 / 1000 Iteration 0, loss = 0.0270 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0200 Iteration 80, loss = 0.0238 --- Epoch 148 / 1000 Iteration 0, loss = 0.0383 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0155 --- Epoch 149 / 1000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0248 Iteration 80, loss = 0.0245 --- Epoch 150 / 1000 Iteration 0, loss = 0.0280 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0132 --- Epoch 151 / 1000 Iteration 0, loss = 0.0090 Iteration 20, 
loss = 0.0177 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0260 Iteration 80, loss = 0.0073 --- Epoch 152 / 1000 Iteration 0, loss = 0.0175 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0228 --- Epoch 153 / 1000 Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0229 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0234 --- Epoch 154 / 1000 Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0131 --- Epoch 155 / 1000 Iteration 0, loss = 0.0228 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0237 Iteration 80, loss = 0.0104 --- Epoch 156 / 1000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0370 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0217 Iteration 80, loss = 0.0153 --- Epoch 157 / 1000 Iteration 0, loss = 0.0184 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0199 Iteration 80, loss = 0.0119 --- Epoch 158 / 1000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0396 --- Epoch 159 / 1000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0238 Iteration 60, loss = 0.0293 Iteration 80, loss = 0.0063 --- Epoch 160 / 1000 Iteration 0, loss = 0.0252 Iteration 20, loss = 0.0167 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0262 --- Epoch 161 / 1000 Iteration 0, loss = 0.0194 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0281 Iteration 80, loss = 0.0145 --- Epoch 162 / 1000 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0260 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0364 --- Epoch 163 / 1000 Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0143 Iteration 
80, loss = 0.0066 --- Epoch 164 / 1000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0118 --- Epoch 165 / 1000 Iteration 0, loss = 0.0304 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0248 --- Epoch 166 / 1000 Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0245 --- Epoch 167 / 1000 Iteration 0, loss = 0.0245 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0337 Iteration 80, loss = 0.0207 --- Epoch 168 / 1000 Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0278 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0073 --- Epoch 169 / 1000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0262 Iteration 60, loss = 0.0190 Iteration 80, loss = 0.0077 --- Epoch 170 / 1000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0335 Iteration 40, loss = 0.0314 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0268 --- Epoch 171 / 1000 Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0156 --- Epoch 172 / 1000 Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0230 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0316 Iteration 80, loss = 0.0074 --- Epoch 173 / 1000 Iteration 0, loss = 0.0232 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0460 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0123 --- Epoch 174 / 1000 Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0222 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0230 Iteration 80, loss = 0.0069 --- Epoch 175 / 1000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0121 --- Epoch 176 / 1000 Iteration 0, loss = 0.0166 Iteration 20, 
loss = 0.0241 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0182 --- Epoch 177 / 1000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0307 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0159 --- Epoch 178 / 1000 Iteration 0, loss = 0.0263 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0272 Iteration 60, loss = 0.0201 Iteration 80, loss = 0.0059 --- Epoch 179 / 1000 Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0307 Iteration 80, loss = 0.0049 --- Epoch 180 / 1000 Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0112 --- Epoch 181 / 1000 Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0184 --- Epoch 182 / 1000 Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0307 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0128 --- Epoch 183 / 1000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0293 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0149 --- Epoch 184 / 1000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0228 Iteration 40, loss = 0.0303 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0105 --- Epoch 185 / 1000 Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0125 --- Epoch 186 / 1000 Iteration 0, loss = 0.0440 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0230 --- Epoch 187 / 1000 Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0193 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0107 --- Epoch 188 / 1000 Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0243 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0266 Iteration 
80, loss = 0.0328 --- Epoch 189 / 1000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0266 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0060 --- Epoch 190 / 1000 Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0161 --- Epoch 191 / 1000 Iteration 0, loss = 0.0304 Iteration 20, loss = 0.0183 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0063 --- Epoch 192 / 1000 Iteration 0, loss = 0.0220 Iteration 20, loss = 0.0219 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0161 --- Epoch 193 / 1000 Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0196 Iteration 40, loss = 0.0212 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0311 --- Epoch 194 / 1000 Iteration 0, loss = 0.0276 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0208 --- Epoch 195 / 1000 Iteration 0, loss = 0.0221 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0159 --- Epoch 196 / 1000 Iteration 0, loss = 0.0167 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0127 --- Epoch 197 / 1000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0164 --- Epoch 198 / 1000 Iteration 0, loss = 0.0259 Iteration 20, loss = 0.0160 Iteration 40, loss = 0.0202 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0210 --- Epoch 199 / 1000 Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0284 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0247 Iteration 80, loss = 0.0133 --- Epoch 200 / 1000 Iteration 0, loss = 0.0469 Iteration 20, loss = 0.0213 Iteration 40, loss = 0.0273 Iteration 60, loss = 0.0190 Iteration 80, loss = 0.0060 --- Epoch 201 / 1000 Iteration 0, loss = 0.0140 Iteration 20, 
loss = 0.0079 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0084 --- Epoch 202 / 1000 Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0161 --- Epoch 203 / 1000 Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0271 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0040 --- Epoch 204 / 1000 Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0169 --- Epoch 205 / 1000 Iteration 0, loss = 0.0246 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0103 --- Epoch 206 / 1000 Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0248 --- Epoch 207 / 1000 Iteration 0, loss = 0.0238 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0245 Iteration 60, loss = 0.0267 Iteration 80, loss = 0.0070 --- Epoch 208 / 1000 Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0144 --- Epoch 209 / 1000 Iteration 0, loss = 0.0298 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0256 Iteration 60, loss = 0.0217 Iteration 80, loss = 0.0206 --- Epoch 210 / 1000 Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0139 --- Epoch 211 / 1000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0102 --- Epoch 212 / 1000 Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0264 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0261 --- Epoch 213 / 1000 Iteration 0, loss = 0.0229 Iteration 20, loss = 0.0312 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0297 Iteration 
80, loss = 0.0051 --- Epoch 214 / 1000 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0196 Iteration 80, loss = 0.0158 --- Epoch 215 / 1000 Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0268 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0079 --- Epoch 216 / 1000 Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0308 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0090 --- Epoch 217 / 1000 Iteration 0, loss = 0.0237 Iteration 20, loss = 0.0301 Iteration 40, loss = 0.0296 Iteration 60, loss = 0.0244 Iteration 80, loss = 0.0180 --- Epoch 218 / 1000 Iteration 0, loss = 0.0538 Iteration 20, loss = 0.0220 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0265 --- Epoch 219 / 1000 Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0236 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0149 --- Epoch 220 / 1000 Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0120 --- Epoch 221 / 1000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0179 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0272 Iteration 80, loss = 0.0098 --- Epoch 222 / 1000 Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0266 Iteration 40, loss = 0.0186 Iteration 60, loss = 0.0237 Iteration 80, loss = 0.0101 --- Epoch 223 / 1000 Iteration 0, loss = 0.0256 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0065 --- Epoch 224 / 1000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0229 Iteration 40, loss = 0.0201 Iteration 60, loss = 0.0190 Iteration 80, loss = 0.0219 --- Epoch 225 / 1000 Iteration 0, loss = 0.0222 Iteration 20, loss = 0.0282 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0220 Iteration 80, loss = 0.0170 --- Epoch 226 / 1000 Iteration 0, loss = 0.0204 Iteration 20, 
loss = 0.0104 Iteration 40, loss = 0.0179 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0075 --- Epoch 227 / 1000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0240 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0191 Iteration 80, loss = 0.0167 --- Epoch 228 / 1000 Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0075 --- Epoch 229 / 1000 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0248 Iteration 80, loss = 0.0092 --- Epoch 230 / 1000 Iteration 0, loss = 0.0136 Iteration 20, loss = 0.0198 Iteration 40, loss = 0.0220 Iteration 60, loss = 0.0225 Iteration 80, loss = 0.0095 --- Epoch 231 / 1000 Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0265 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0215 Iteration 80, loss = 0.0288 --- Epoch 232 / 1000 Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0197 Iteration 80, loss = 0.0120 --- Epoch 233 / 1000 Iteration 0, loss = 0.0237 Iteration 20, loss = 0.0243 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0215 --- Epoch 234 / 1000 Iteration 0, loss = 0.0184 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0221 Iteration 80, loss = 0.0166 --- Epoch 235 / 1000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0160 --- Epoch 236 / 1000 Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0236 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0201 --- Epoch 237 / 1000 Iteration 0, loss = 0.0232 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0093 --- Epoch 238 / 1000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0018 Iteration 
80, loss = 0.0105 --- Epoch 239 / 1000 Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0262 Iteration 40, loss = 0.0404 Iteration 60, loss = 0.0362 Iteration 80, loss = 0.0149 --- Epoch 240 / 1000 Iteration 0, loss = 0.0219 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0220 Iteration 80, loss = 0.0100 --- Epoch 241 / 1000 Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0144 --- Epoch 242 / 1000 Iteration 0, loss = 0.0230 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0113 --- Epoch 243 / 1000 Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0061 --- Epoch 244 / 1000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0215 Iteration 80, loss = 0.0092 --- Epoch 245 / 1000 Iteration 0, loss = 0.0185 Iteration 20, loss = 0.0276 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0099 --- Epoch 246 / 1000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0189 --- Epoch 247 / 1000 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0210 --- Epoch 248 / 1000 Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0217 --- Epoch 249 / 1000 Iteration 0, loss = 0.0266 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0244 Iteration 80, loss = 0.0160 --- Epoch 250 / 1000 Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0355 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0152 --- Epoch 251 / 1000 Iteration 0, loss = 0.0156 Iteration 20, 
loss = 0.0283 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0103 --- Epoch 252 / 1000 Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0175 --- Epoch 253 / 1000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0252 --- Epoch 254 / 1000 Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0092 --- Epoch 255 / 1000 Iteration 0, loss = 0.0236 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0261 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0078 --- Epoch 256 / 1000 Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0109 --- Epoch 257 / 1000 Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0290 Iteration 80, loss = 0.0107 --- Epoch 258 / 1000 Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0153 --- Epoch 259 / 1000 Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0253 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0205 Iteration 80, loss = 0.0199 --- Epoch 260 / 1000 Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0286 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0216 Iteration 80, loss = 0.0232 --- Epoch 261 / 1000 Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0131 --- Epoch 262 / 1000 Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0137 --- Epoch 263 / 1000 Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0337 Iteration 60, loss = 0.0099 Iteration 
80, loss = 0.0056 --- Epoch 264 / 1000 Iteration 0, loss = 0.0312 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0194 --- Epoch 265 / 1000 Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0236 --- Epoch 266 / 1000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0186 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0111 --- Epoch 267 / 1000 Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0048 --- Epoch 268 / 1000 Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0193 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0277 --- Epoch 269 / 1000 Iteration 0, loss = 0.0232 Iteration 20, loss = 0.0270 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0187 Iteration 80, loss = 0.0129 --- Epoch 270 / 1000 Iteration 0, loss = 0.0186 Iteration 20, loss = 0.0209 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0120 --- Epoch 271 / 1000 Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0118 --- Epoch 272 / 1000 Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0208 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0174 --- Epoch 273 / 1000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0183 Iteration 80, loss = 0.0300 --- Epoch 274 / 1000 Iteration 0, loss = 0.0212 Iteration 20, loss = 0.0179 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0056 --- Epoch 275 / 1000 Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0252 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0070 --- Epoch 276 / 1000 Iteration 0, loss = 0.0074 Iteration 20, 
loss = 0.0165 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0215 Iteration 80, loss = 0.0168 --- Epoch 277 / 1000 Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0260 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0129 --- Epoch 278 / 1000 Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0350 Iteration 80, loss = 0.0546 --- Epoch 279 / 1000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0236 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0077 --- Epoch 280 / 1000 Iteration 0, loss = 0.0335 Iteration 20, loss = 0.0241 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0282 --- Epoch 281 / 1000 Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0224 --- Epoch 282 / 1000 Iteration 0, loss = 0.0229 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0221 Iteration 80, loss = 0.0082 --- Epoch 283 / 1000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0193 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0182 --- Epoch 284 / 1000 Iteration 0, loss = 0.0372 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0277 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0079 --- Epoch 285 / 1000 Iteration 0, loss = 0.0237 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0179 --- Epoch 286 / 1000 Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0209 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0247 Iteration 80, loss = 0.0087 --- Epoch 287 / 1000 Iteration 0, loss = 0.0344 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0325 Iteration 80, loss = 0.0127 --- Epoch 288 / 1000 Iteration 0, loss = 0.0402 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0084 Iteration 
80, loss = 0.0080 --- Epoch 289 / 1000 Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0152 --- Epoch 290 / 1000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0154 --- Epoch 291 / 1000 Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0168 --- Epoch 292 / 1000 Iteration 0, loss = 0.0157 Iteration 20, loss = 0.0188 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0224 Iteration 80, loss = 0.0142 --- Epoch 293 / 1000 Iteration 0, loss = 0.0289 Iteration 20, loss = 0.0259 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0370 Iteration 80, loss = 0.0158 --- Epoch 294 / 1000 Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0247 Iteration 80, loss = 0.0246 --- Epoch 295 / 1000 Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0089 --- Epoch 296 / 1000 Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0154 Iteration 80, loss = 0.0064 --- Epoch 297 / 1000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0119 --- Epoch 298 / 1000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0186 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0302 Iteration 80, loss = 0.0127 --- Epoch 299 / 1000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0201 Iteration 80, loss = 0.0175 --- Epoch 300 / 1000 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0202 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0190 --- Epoch 301 / 1000 Iteration 0, loss = 0.0108 Iteration 20, 
loss = 0.0136 Iteration 40, loss = 0.0231 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0142 --- Epoch 302 / 1000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0137 --- Epoch 303 / 1000 Iteration 0, loss = 0.0194 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0111 --- Epoch 304 / 1000 Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0386 Iteration 40, loss = 0.0202 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0303 --- Epoch 305 / 1000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0187 Iteration 80, loss = 0.0164 --- Epoch 306 / 1000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0060 --- Epoch 307 / 1000 Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0025 --- Epoch 308 / 1000 Iteration 0, loss = 0.0272 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0144 Iteration 80, loss = 0.0179 --- Epoch 309 / 1000 Iteration 0, loss = 0.0277 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0047 --- Epoch 310 / 1000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0205 --- Epoch 311 / 1000 Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0197 --- Epoch 312 / 1000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0130 --- Epoch 313 / 1000 Iteration 0, loss = 0.0190 Iteration 20, loss = 0.0161 Iteration 40, loss = 0.0208 Iteration 60, loss = 0.0214 Iteration 
80, loss = 0.0053 --- Epoch 314 / 1000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0161 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0238 --- Epoch 315 / 1000 Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0303 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0205 --- Epoch 316 / 1000 Iteration 0, loss = 0.0221 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0194 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0189 --- Epoch 317 / 1000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0232 Iteration 80, loss = 0.0214 --- Epoch 318 / 1000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0184 Iteration 80, loss = 0.0049 --- Epoch 319 / 1000 Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0059 --- Epoch 320 / 1000 Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0224 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0204 --- Epoch 321 / 1000 Iteration 0, loss = 0.0277 Iteration 20, loss = 0.0209 Iteration 40, loss = 0.0225 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0096 --- Epoch 322 / 1000 Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0179 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0133 --- Epoch 323 / 1000 Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0084 --- Epoch 324 / 1000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0192 Iteration 40, loss = 0.0262 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0457 --- Epoch 325 / 1000 Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0275 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0222 Iteration 80, loss = 0.0145 --- Epoch 326 / 1000 Iteration 0, loss = 0.0054 Iteration 20, 
loss = 0.0111 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0210 --- Epoch 327 / 1000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0232 Iteration 60, loss = 0.0125 Iteration 80, loss = 0.0197 --- Epoch 328 / 1000 Iteration 0, loss = 0.0551 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0187 Iteration 80, loss = 0.0150 --- Epoch 329 / 1000 Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0173 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0243 Iteration 80, loss = 0.0179 --- Epoch 330 / 1000 Iteration 0, loss = 0.0157 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0104 --- Epoch 331 / 1000 Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0197 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0085 --- Epoch 332 / 1000 Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0308 Iteration 40, loss = 0.0318 Iteration 60, loss = 0.0240 Iteration 80, loss = 0.0181 --- Epoch 333 / 1000 Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0115 --- Epoch 334 / 1000 Iteration 0, loss = 0.0307 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0375 Iteration 60, loss = 0.0186 Iteration 80, loss = 0.0177 --- Epoch 335 / 1000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0307 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0162 --- Epoch 336 / 1000 Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0070 --- Epoch 337 / 1000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0277 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0099 --- Epoch 338 / 1000 Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0101 Iteration 
80, loss = 0.0191 --- Epoch 339 / 1000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0168 --- Epoch 340 / 1000 Iteration 0, loss = 0.0194 Iteration 20, loss = 0.0314 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0079 --- Epoch 341 / 1000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0203 --- Epoch 342 / 1000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0366 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0095 --- Epoch 343 / 1000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0122 --- Epoch 344 / 1000 Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0182 Iteration 40, loss = 0.0919 Iteration 60, loss = 0.0258 Iteration 80, loss = 0.0122 --- Epoch 345 / 1000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0221 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0086 --- Epoch 346 / 1000 Iteration 0, loss = 0.0197 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0093 --- Epoch 347 / 1000 Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0179 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0127 --- Epoch 348 / 1000 Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0186 --- Epoch 349 / 1000 Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0204 Iteration 80, loss = 0.0260 --- Epoch 350 / 1000 Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0325 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0147 --- Epoch 351 / 1000 Iteration 0, loss = 0.0111 Iteration 20, 
loss = 0.0225 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0057 --- Epoch 352 / 1000 Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0064 --- Epoch 353 / 1000 Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0312 Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0281 Iteration 80, loss = 0.0115 --- Epoch 354 / 1000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0218 --- Epoch 355 / 1000 Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0075 --- Epoch 356 / 1000 Iteration 0, loss = 0.0224 Iteration 20, loss = 0.0302 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0347 Iteration 80, loss = 0.0147 --- Epoch 357 / 1000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0105 --- Epoch 358 / 1000 Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0211 Iteration 80, loss = 0.0191 --- Epoch 359 / 1000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0262 Iteration 80, loss = 0.0050 --- Epoch 360 / 1000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0162 --- Epoch 361 / 1000 Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0332 Iteration 60, loss = 0.0302 Iteration 80, loss = 0.0122 --- Epoch 362 / 1000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0219 Iteration 80, loss = 0.0073 --- Epoch 363 / 1000 Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0296 Iteration 60, loss = 0.0104 Iteration 
80, loss = 0.0233 --- Epoch 364 / 1000 Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0144 Iteration 80, loss = 0.0089 --- Epoch 365 / 1000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0247 Iteration 80, loss = 0.0143 --- Epoch 366 / 1000 Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0155 --- Epoch 367 / 1000 Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0104 --- Epoch 368 / 1000 Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0045 --- Epoch 369 / 1000 Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0065 --- Epoch 370 / 1000 Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0199 Iteration 80, loss = 0.0205 --- Epoch 371 / 1000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0164 --- Epoch 372 / 1000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0291 Iteration 60, loss = 0.0209 Iteration 80, loss = 0.0187 --- Epoch 373 / 1000 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0178 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0225 --- Epoch 374 / 1000 Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0041 --- Epoch 375 / 1000 Iteration 0, loss = 0.0222 Iteration 20, loss = 0.0768 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0051
--------------------------------------------------------------------------- KeyboardInterrupt Traceback (most recent call last) <ipython-input-215-506d6bf61503> in <module> ----> 1 train(model7, optimizer, epochs=1000, x_train=data["X_train_class"], y_train=data["y_train_class"], criterion=custom_loss) <ipython-input-164-7b479c5968e4> in train(model, optimizer, epochs, x_train, y_train, criterion) 38 # This is the backwards pass: compute the gradient of the loss with 39 # respect to each parameter of the model. ---> 40 loss.backward() 41 42 # Actually update the parameters of the model using the gradients /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/tensor.py in backward(self, gradient, retain_graph, create_graph) 183 products. Defaults to ``False``. 184 """ --> 185 torch.autograd.backward(self, gradient, retain_graph, create_graph) 186 187 def register_hook(self, hook): /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/autograd/__init__.py in backward(tensors, grad_tensors, retain_graph, create_graph, grad_variables) 125 Variable._execution_engine.run_backward( 126 tensors, grad_tensors, retain_graph, create_graph, --> 127 allow_unreachable=True) # allow_unreachable flag 128 129 KeyboardInterrupt:
# Run testModel on model7 using the "ship" test inputs and targets.
# NOTE(review): the recorded output of this cell is a NameError for
# `testModel`, so the cell defining it must be executed in the current
# session before this call.
testModel(
    model7,
    x_test=data["X_test_ship"],
    y_test=data["y_test_ship"],
)
--------------------------------------------------------------------------- NameError Traceback (most recent call last) <ipython-input-7-655c38579b03> in <module> ----> 1 testModel(model7, x_test=data["X_test_ship"], y_test=data["y_test_ship"]) NameError: name 'testModel' is not defined
class ConvNet3(nn.Module):
    """Convolutional encoder-decoder mapping one input channel to three.

    The encoder applies four 3x3 convolutions, three of them with stride 2,
    so the spatial size shrinks by a factor of 8.  The decoder applies three
    2x bilinear upsamplings interleaved with 3x3 convolutions, and the last
    convolution is squashed with ``tanh``.  Height and width should be
    multiples of 8 for the output to have the same spatial size as the input.
    """

    def __init__(self):
        super().__init__()
        # Counter initialised to zero; it is not modified inside this class.
        self.epochsTrained = 0

        # Layers are created in the same order as before so that state_dict
        # keys and seeded parameter initialisation stay unchanged.
        self.batchnorm1 = nn.BatchNorm2d(32)
        self.batchnorm2 = nn.BatchNorm2d(64)
        self.batchnorm3 = nn.BatchNorm2d(128)
        self.batchnorm4 = nn.BatchNorm2d(128)
        self.batchnorm5 = nn.BatchNorm2d(64)
        self.batchnorm6 = nn.BatchNorm2d(32)

        # align_corners=False is what bilinear Upsample already does when the
        # argument is omitted; passing it explicitly avoids the warning some
        # PyTorch versions emit on every forward pass.
        self.upsample = nn.Upsample(
            scale_factor=2, mode='bilinear', align_corners=False
        )

        # Encoder convolutions (conv2-conv4 halve the spatial size).
        self.conv1 = nn.Conv2d(1, 32, kernel_size=3, padding=1)
        self.conv2 = nn.Conv2d(32, 64, kernel_size=3, stride=2, padding=1)
        self.conv3 = nn.Conv2d(64, 128, kernel_size=3, stride=2, padding=1)
        self.conv4 = nn.Conv2d(128, 128, kernel_size=3, stride=2, padding=1)
        # Decoder convolutions (each one follows a 2x upsampling).
        self.conv5 = nn.Conv2d(128, 64, kernel_size=3, padding=1)
        self.conv6 = nn.Conv2d(64, 32, kernel_size=3, padding=1)
        self.conv7 = nn.Conv2d(32, 3, kernel_size=3, padding=1)

    def forward(self, x):
        """Predict a three-channel image from channel 0 of ``x``.

        Args:
            x: A single image tensor of shape (C, H, W) or a batch of shape
                (N, C, H, W).  Only channel 0 is fed to the network.

        Returns:
            Tensor with 3 channels and a leading batch dimension (size 1 for
            a single image), with values in [-1, 1] from the final ``tanh``.

        Raises:
            ValueError: If ``x`` is neither 3-D nor 4-D.
        """
        if x.dim() == 3:
            # Single image: keep channel 0 and add batch and channel axes.
            x = x[0, :, :].unsqueeze(0).unsqueeze(0)
        elif x.dim() == 4:
            # Batch: keep channel 0 of every image, preserving the channel axis.
            x = x[:, :1, :, :]
        else:
            raise ValueError(
                "ConvNet3 expects a (C, H, W) or (N, C, H, W) tensor, "
                "got %d dimensions" % x.dim()
            )

        # Encoder
        scores = F.relu(self.batchnorm1(self.conv1(x)))
        scores = F.relu(self.batchnorm2(self.conv2(scores)))
        scores = F.relu(self.batchnorm3(self.conv3(scores)))
        scores = F.relu(self.batchnorm4(self.conv4(scores)))

        # Decoder
        scores = self.upsample(scores)
        scores = F.relu(self.batchnorm5(self.conv5(scores)))
        scores = self.upsample(scores)
        scores = F.relu(self.batchnorm6(self.conv6(scores)))
        scores = self.upsample(scores)
        scores = torch.tanh(self.conv7(scores))
        return scores
# Build a fresh ConvNet3 and optimise it with plain SGD on an MSE objective.
model8 = ConvNet3()
learning_rate = 5e-2
optimizer = optim.SGD(model8.parameters(), lr=learning_rate)

# NOTE(review): the epoch count is a very large upper bound; presumably the
# run is meant to be interrupted by hand once the loss plateaus -- confirm.
train(
    model8,
    optimizer,
    epochs=100000,
    x_train=data["X_train_class"],
    y_train=data["y_train_class"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 100000 Iteration 0, loss = 0.1976 Iteration 20, loss = 0.0927 Iteration 40, loss = 0.1733 Iteration 60, loss = 0.0530 Iteration 80, loss = 0.0337 --- Epoch 2 / 100000 Iteration 0, loss = 0.0477 Iteration 20, loss = 0.0444 Iteration 40, loss = 0.0882 Iteration 60, loss = 0.0287 Iteration 80, loss = 0.0167 --- Epoch 3 / 100000 Iteration 0, loss = 0.0318 Iteration 20, loss = 0.0313 Iteration 40, loss = 0.0402 Iteration 60, loss = 0.0319 Iteration 80, loss = 0.0271 --- Epoch 4 / 100000 Iteration 0, loss = 0.1399 Iteration 20, loss = 0.0340 Iteration 40, loss = 0.0406 Iteration 60, loss = 0.0521 Iteration 80, loss = 0.0920 --- Epoch 5 / 100000 Iteration 0, loss = 0.0605 Iteration 20, loss = 0.0213 Iteration 40, loss = 0.0415 Iteration 60, loss = 0.0706 Iteration 80, loss = 0.0520 --- Epoch 6 / 100000 Iteration 0, loss = 0.0535 Iteration 20, loss = 0.0244 Iteration 40, loss = 0.0672 Iteration 60, loss = 0.0459 Iteration 80, loss = 0.0288 --- Epoch 7 / 100000 Iteration 0, loss = 0.0341 Iteration 20, loss = 0.0614 Iteration 40, loss = 0.0282 Iteration 60, loss = 0.0438 Iteration 80, loss = 0.0370 --- Epoch 8 / 100000 Iteration 0, loss = 0.0380 Iteration 20, loss = 0.0354 Iteration 40, loss = 0.0258 Iteration 60, loss = 0.0358 Iteration 80, loss = 0.0340 --- Epoch 9 / 100000 Iteration 0, loss = 0.0496 Iteration 20, loss = 0.0540 Iteration 40, loss = 0.0313 Iteration 60, loss = 0.0265 Iteration 80, loss = 0.0287 --- Epoch 10 / 100000 Iteration 0, loss = 0.0360 Iteration 20, loss = 0.0247 Iteration 40, loss = 0.0380 Iteration 60, loss = 0.0584 Iteration 80, loss = 0.0485 --- Epoch 11 / 100000 Iteration 0, loss = 0.0334 Iteration 20, loss = 0.0365 Iteration 40, loss = 0.0245 Iteration 60, loss = 0.0408 Iteration 80, loss = 0.0423 --- Epoch 12 / 100000 Iteration 0, loss = 0.0347 Iteration 20, loss = 0.0254 Iteration 40, loss = 0.0262 Iteration 60, loss = 0.0203 Iteration 80, loss = 0.0754 --- Epoch 13 / 100000 Iteration 0, loss = 0.0351 Iteration 20, loss = 0.0237 
Iteration 40, loss = 0.0437 Iteration 60, loss = 0.0341 Iteration 80, loss = 0.0482 --- Epoch 14 / 100000 Iteration 0, loss = 0.0326 Iteration 20, loss = 0.1028 Iteration 40, loss = 0.0316 Iteration 60, loss = 0.0360 Iteration 80, loss = 0.0439 --- Epoch 15 / 100000 Iteration 0, loss = 0.0764 Iteration 20, loss = 0.0274 Iteration 40, loss = 0.0196 Iteration 60, loss = 0.0262 Iteration 80, loss = 0.0331 --- Epoch 16 / 100000 Iteration 0, loss = 0.0450 Iteration 20, loss = 0.0352 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0636 --- Epoch 17 / 100000 Iteration 0, loss = 0.0328 Iteration 20, loss = 0.0384 Iteration 40, loss = 0.0201 Iteration 60, loss = 0.0609 Iteration 80, loss = 0.0288 --- Epoch 18 / 100000 Iteration 0, loss = 0.0740 Iteration 20, loss = 0.0288 Iteration 40, loss = 0.0257 Iteration 60, loss = 0.0446 Iteration 80, loss = 0.0555 --- Epoch 19 / 100000 Iteration 0, loss = 0.0608 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0368 Iteration 60, loss = 0.0220 Iteration 80, loss = 0.0565 --- Epoch 20 / 100000 Iteration 0, loss = 0.0355 Iteration 20, loss = 0.0769 Iteration 40, loss = 0.0236 Iteration 60, loss = 0.0232 Iteration 80, loss = 0.0690 --- Epoch 21 / 100000 Iteration 0, loss = 0.0260 Iteration 20, loss = 0.0500 Iteration 40, loss = 0.0284 Iteration 60, loss = 0.0251 Iteration 80, loss = 0.0297 --- Epoch 22 / 100000 Iteration 0, loss = 0.0381 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0207 Iteration 60, loss = 0.0218 Iteration 80, loss = 0.0194 --- Epoch 23 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0309 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0252 Iteration 80, loss = 0.0331 --- Epoch 24 / 100000 Iteration 0, loss = 0.0360 Iteration 20, loss = 0.0739 Iteration 40, loss = 0.0271 Iteration 60, loss = 0.0274 Iteration 80, loss = 0.0224 --- Epoch 25 / 100000 Iteration 0, loss = 0.0675 Iteration 20, loss = 0.0219 Iteration 40, loss = 0.0374 Iteration 60, loss = 0.0255 Iteration 
80, loss = 0.0583 --- Epoch 26 / 100000 Iteration 0, loss = 0.0353 Iteration 20, loss = 0.0301 Iteration 40, loss = 0.0452 Iteration 60, loss = 0.0239 Iteration 80, loss = 0.0224 --- Epoch 27 / 100000 Iteration 0, loss = 0.0582 Iteration 20, loss = 0.0410 Iteration 40, loss = 0.0372 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0599 --- Epoch 28 / 100000 Iteration 0, loss = 0.0430 Iteration 20, loss = 0.0259 Iteration 40, loss = 0.0174 Iteration 60, loss = 0.0475 Iteration 80, loss = 0.0303 --- Epoch 29 / 100000 Iteration 0, loss = 0.0277 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0263 Iteration 60, loss = 0.0296 Iteration 80, loss = 0.0255 --- Epoch 30 / 100000 Iteration 0, loss = 0.0309 Iteration 20, loss = 0.0323 Iteration 40, loss = 0.0285 Iteration 60, loss = 0.0521 Iteration 80, loss = 0.0162 --- Epoch 31 / 100000 Iteration 0, loss = 0.0313 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0211 Iteration 60, loss = 0.0433 Iteration 80, loss = 0.0287 --- Epoch 32 / 100000 Iteration 0, loss = 0.0298 Iteration 20, loss = 0.0414 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0536 Iteration 80, loss = 0.0246 --- Epoch 33 / 100000 Iteration 0, loss = 0.0730 Iteration 20, loss = 0.0395 Iteration 40, loss = 0.0476 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0332 --- Epoch 34 / 100000 Iteration 0, loss = 0.0482 Iteration 20, loss = 0.0509 Iteration 40, loss = 0.0369 Iteration 60, loss = 0.0318 Iteration 80, loss = 0.0278 --- Epoch 35 / 100000 Iteration 0, loss = 0.0236 Iteration 20, loss = 0.0674 Iteration 40, loss = 0.0588 Iteration 60, loss = 0.0473 Iteration 80, loss = 0.0314 --- Epoch 36 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0778 Iteration 60, loss = 0.0372 Iteration 80, loss = 0.0194 --- Epoch 37 / 100000 Iteration 0, loss = 0.0307 Iteration 20, loss = 0.0323 Iteration 40, loss = 0.0429 Iteration 60, loss = 0.0272 Iteration 80, loss = 0.0203 --- Epoch 38 / 100000 Iteration 0, loss = 0.0503 
Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0308 Iteration 60, loss = 0.0372 Iteration 80, loss = 0.0377 --- Epoch 39 / 100000 Iteration 0, loss = 0.0306 Iteration 20, loss = 0.0362 Iteration 40, loss = 0.0341 Iteration 60, loss = 0.0250 Iteration 80, loss = 0.0344 --- Epoch 40 / 100000 Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0255 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0238 Iteration 80, loss = 0.0166 --- Epoch 41 / 100000 Iteration 0, loss = 0.0561 Iteration 20, loss = 0.0557 Iteration 40, loss = 0.0315 Iteration 60, loss = 0.0167 Iteration 80, loss = 0.0309 --- Epoch 42 / 100000 Iteration 0, loss = 0.0339 Iteration 20, loss = 0.0273 Iteration 40, loss = 0.0242 Iteration 60, loss = 0.0335 Iteration 80, loss = 0.0088 --- Epoch 43 / 100000 Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0332 Iteration 40, loss = 0.0199 Iteration 60, loss = 0.0365 Iteration 80, loss = 0.0149 --- Epoch 44 / 100000 Iteration 0, loss = 0.0241 Iteration 20, loss = 0.0277 Iteration 40, loss = 0.0322 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0184 --- Epoch 45 / 100000 Iteration 0, loss = 0.0376 Iteration 20, loss = 0.0237 Iteration 40, loss = 0.0341 Iteration 60, loss = 0.0267 Iteration 80, loss = 0.0710 --- Epoch 46 / 100000 Iteration 0, loss = 0.0311 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0210 Iteration 60, loss = 0.0282 Iteration 80, loss = 0.0380 --- Epoch 47 / 100000 Iteration 0, loss = 0.0225 Iteration 20, loss = 0.0276 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0517 --- Epoch 48 / 100000 Iteration 0, loss = 0.0220 Iteration 20, loss = 0.0689 Iteration 40, loss = 0.0451 Iteration 60, loss = 0.0430 Iteration 80, loss = 0.0217 --- Epoch 49 / 100000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0243 Iteration 40, loss = 0.0316 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0327 --- Epoch 50 / 100000 Iteration 0, loss = 0.0283 Iteration 20, loss = 0.0206 Iteration 40, loss = 0.0288 Iteration 
60, loss = 0.0274 Iteration 80, loss = 0.0187 --- Epoch 51 / 100000 Iteration 0, loss = 0.0285 Iteration 20, loss = 0.0183 Iteration 40, loss = 0.0244 Iteration 60, loss = 0.0278 Iteration 80, loss = 0.0256 --- Epoch 52 / 100000 Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0375 Iteration 40, loss = 0.0173 Iteration 60, loss = 0.0467 Iteration 80, loss = 0.0378 --- Epoch 53 / 100000 Iteration 0, loss = 0.0385 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0355 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0161 --- Epoch 54 / 100000 Iteration 0, loss = 0.0229 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0315 Iteration 60, loss = 0.0478 Iteration 80, loss = 0.0824 --- Epoch 55 / 100000 Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0137 Iteration 80, loss = 0.0324 --- Epoch 56 / 100000 Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0197 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0195 --- Epoch 57 / 100000 Iteration 0, loss = 0.0454 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0229 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0260 --- Epoch 58 / 100000 Iteration 0, loss = 0.0570 Iteration 20, loss = 0.0897 Iteration 40, loss = 0.0759 Iteration 60, loss = 0.0204 Iteration 80, loss = 0.0340 --- Epoch 59 / 100000 Iteration 0, loss = 0.0257 Iteration 20, loss = 0.0310 Iteration 40, loss = 0.0392 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0248 --- Epoch 60 / 100000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0319 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0330 Iteration 80, loss = 0.0215 --- Epoch 61 / 100000 Iteration 0, loss = 0.0225 Iteration 20, loss = 0.0167 Iteration 40, loss = 0.0233 Iteration 60, loss = 0.0239 Iteration 80, loss = 0.0319 --- Epoch 62 / 100000 Iteration 0, loss = 0.0270 Iteration 20, loss = 0.0294 Iteration 40, loss = 0.0491 Iteration 60, loss = 0.0623 Iteration 80, loss = 0.0242 --- Epoch 63 / 100000 
Iteration 0, loss = 0.0260 Iteration 20, loss = 0.0303 Iteration 40, loss = 0.0371 Iteration 60, loss = 0.0227 Iteration 80, loss = 0.0215 --- Epoch 64 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0332 Iteration 40, loss = 0.0287 Iteration 60, loss = 0.0266 Iteration 80, loss = 0.0345 --- Epoch 65 / 100000 Iteration 0, loss = 0.0283 Iteration 20, loss = 0.0217 Iteration 40, loss = 0.0406 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0389 --- Epoch 66 / 100000 Iteration 0, loss = 0.0226 Iteration 20, loss = 0.0322 Iteration 40, loss = 0.0352 Iteration 60, loss = 0.0248 Iteration 80, loss = 0.0280 --- Epoch 67 / 100000 Iteration 0, loss = 0.0285 Iteration 20, loss = 0.0263 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0253 --- Epoch 68 / 100000 Iteration 0, loss = 0.0392 Iteration 20, loss = 0.0395 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0287 Iteration 80, loss = 0.0183 --- Epoch 69 / 100000 Iteration 0, loss = 0.0332 Iteration 20, loss = 0.0385 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0229 Iteration 80, loss = 0.0363 --- Epoch 70 / 100000 Iteration 0, loss = 0.0212 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0277 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0144 --- Epoch 71 / 100000 Iteration 0, loss = 0.0285 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0290 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0247 --- Epoch 72 / 100000 Iteration 0, loss = 0.0381 Iteration 20, loss = 0.0227 Iteration 40, loss = 0.0326 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0179 --- Epoch 73 / 100000 Iteration 0, loss = 0.0402 Iteration 20, loss = 0.0261 Iteration 40, loss = 0.0379 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0308 --- Epoch 74 / 100000 Iteration 0, loss = 0.0251 Iteration 20, loss = 0.0297 Iteration 40, loss = 0.0208 Iteration 60, loss = 0.0305 Iteration 80, loss = 0.0356 --- Epoch 75 / 100000 Iteration 0, loss = 0.0310 Iteration 20, loss = 0.0190 Iteration 
40, loss = 0.0249 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0238 --- Epoch 76 / 100000 Iteration 0, loss = 0.0275 Iteration 20, loss = 0.0329 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0305 Iteration 80, loss = 0.0284 --- Epoch 77 / 100000 Iteration 0, loss = 0.0220 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0403 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0242 --- Epoch 78 / 100000 Iteration 0, loss = 0.0239 Iteration 20, loss = 0.0199 Iteration 40, loss = 0.0417 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0430 --- Epoch 79 / 100000 Iteration 0, loss = 0.0256 Iteration 20, loss = 0.0243 Iteration 40, loss = 0.0357 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0177 --- Epoch 80 / 100000 Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0531 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0487 --- Epoch 81 / 100000 Iteration 0, loss = 0.0206 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0191 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0157 --- Epoch 82 / 100000 Iteration 0, loss = 0.0194 Iteration 20, loss = 0.0216 Iteration 40, loss = 0.0312 Iteration 60, loss = 0.0270 Iteration 80, loss = 0.0436 --- Epoch 83 / 100000 Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0294 Iteration 40, loss = 0.0332 Iteration 60, loss = 0.0247 Iteration 80, loss = 0.0224 --- Epoch 84 / 100000 Iteration 0, loss = 0.0260 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0264 Iteration 80, loss = 0.0151 --- Epoch 85 / 100000 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0254 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0221 Iteration 80, loss = 0.0168 --- Epoch 86 / 100000 Iteration 0, loss = 0.0250 Iteration 20, loss = 0.0250 Iteration 40, loss = 0.0197 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0146 --- Epoch 87 / 100000 Iteration 0, loss = 0.0265 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0237 Iteration 80, loss = 
0.0191 --- Epoch 88 / 100000 Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0311 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0300 --- Epoch 89 / 100000 Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0246 Iteration 80, loss = 0.0397 --- Epoch 90 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0238 Iteration 60, loss = 0.0288 Iteration 80, loss = 0.0212 --- Epoch 91 / 100000 Iteration 0, loss = 0.0264 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0286 Iteration 80, loss = 0.0231 --- Epoch 92 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0360 Iteration 40, loss = 0.0284 Iteration 60, loss = 0.0213 Iteration 80, loss = 0.0144 --- Epoch 93 / 100000 Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0324 Iteration 60, loss = 0.0249 Iteration 80, loss = 0.0140 --- Epoch 94 / 100000 Iteration 0, loss = 0.0274 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0208 Iteration 60, loss = 0.0304 Iteration 80, loss = 0.0288 --- Epoch 95 / 100000 Iteration 0, loss = 0.0307 Iteration 20, loss = 0.0267 Iteration 40, loss = 0.0235 Iteration 60, loss = 0.0296 Iteration 80, loss = 0.0162 --- Epoch 96 / 100000 Iteration 0, loss = 0.0239 Iteration 20, loss = 0.0380 Iteration 40, loss = 0.0309 Iteration 60, loss = 0.0385 Iteration 80, loss = 0.0264 --- Epoch 97 / 100000 Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0240 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0205 Iteration 80, loss = 0.0205 --- Epoch 98 / 100000 Iteration 0, loss = 0.0321 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0446 Iteration 60, loss = 0.0272 Iteration 80, loss = 0.0128 --- Epoch 99 / 100000 Iteration 0, loss = 0.0177 Iteration 20, loss = 0.0213 Iteration 40, loss = 0.0370 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0273 --- Epoch 100 / 100000 Iteration 0, loss = 0.0165 Iteration 
20, loss = 0.0218 Iteration 40, loss = 0.0358 Iteration 60, loss = 0.0330 Iteration 80, loss = 0.0278 --- Epoch 101 / 100000 Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0287 Iteration 40, loss = 0.0354 Iteration 60, loss = 0.0304 Iteration 80, loss = 0.0155 --- Epoch 102 / 100000 Iteration 0, loss = 0.0369 Iteration 20, loss = 0.0282 Iteration 40, loss = 0.0177 Iteration 60, loss = 0.0197 Iteration 80, loss = 0.0251 --- Epoch 103 / 100000 Iteration 0, loss = 0.0282 Iteration 20, loss = 0.0186 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0235 Iteration 80, loss = 0.0505 --- Epoch 104 / 100000 Iteration 0, loss = 0.0222 Iteration 20, loss = 0.0290 Iteration 40, loss = 0.0215 Iteration 60, loss = 0.0255 Iteration 80, loss = 0.0255 --- Epoch 105 / 100000 Iteration 0, loss = 0.0590 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0360 Iteration 60, loss = 0.0256 Iteration 80, loss = 0.0158 --- Epoch 106 / 100000 Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0402 Iteration 40, loss = 0.0454 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0253 --- Epoch 107 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0224 --- Epoch 108 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0330 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0241 --- Epoch 109 / 100000 Iteration 0, loss = 0.0288 Iteration 20, loss = 0.0341 Iteration 40, loss = 0.0246 Iteration 60, loss = 0.0242 Iteration 80, loss = 0.0233 --- Epoch 110 / 100000 Iteration 0, loss = 0.0174 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0214 Iteration 80, loss = 0.0143 --- Epoch 111 / 100000 Iteration 0, loss = 0.0279 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0472 Iteration 60, loss = 0.0628 Iteration 80, loss = 0.0128 --- Epoch 112 / 100000 Iteration 0, loss = 0.0282 Iteration 20, loss = 0.0173 Iteration 40, loss = 0.0227 Iteration 
60, loss = 0.0255 Iteration 80, loss = 0.0439 --- Epoch 113 / 100000 Iteration 0, loss = 0.0318 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0161 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0138 --- Epoch 114 / 100000 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0213 Iteration 80, loss = 0.0068 --- Epoch 115 / 100000 Iteration 0, loss = 0.0392 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0318 --- Epoch 116 / 100000 Iteration 0, loss = 0.0215 Iteration 20, loss = 0.0212 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0455 Iteration 80, loss = 0.0164 --- Epoch 117 / 100000 Iteration 0, loss = 0.0174 Iteration 20, loss = 0.0326 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0260 Iteration 80, loss = 0.0137 --- Epoch 118 / 100000 Iteration 0, loss = 0.0276 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0317 Iteration 80, loss = 0.0301 --- Epoch 119 / 100000 Iteration 0, loss = 0.0246 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0425 Iteration 80, loss = 0.0187 --- Epoch 120 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0159 Iteration 80, loss = 0.0167 --- Epoch 121 / 100000 Iteration 0, loss = 0.0264 Iteration 20, loss = 0.0197 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0207 Iteration 80, loss = 0.0552 --- Epoch 122 / 100000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0216 Iteration 80, loss = 0.0103 --- Epoch 123 / 100000 Iteration 0, loss = 0.0231 Iteration 20, loss = 0.0302 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0242 Iteration 80, loss = 0.0205 --- Epoch 124 / 100000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0199 Iteration 60, loss = 0.0189 Iteration 80, loss = 0.0284 --- Epoch 
125 / 100000 Iteration 0, loss = 0.0206 Iteration 20, loss = 0.0254 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0107 --- Epoch 126 / 100000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0282 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0119 --- Epoch 127 / 100000 Iteration 0, loss = 0.0288 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0141 --- Epoch 128 / 100000 Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0309 Iteration 40, loss = 0.0308 Iteration 60, loss = 0.0194 Iteration 80, loss = 0.0294 --- Epoch 129 / 100000 Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0303 Iteration 40, loss = 0.0430 Iteration 60, loss = 0.0255 Iteration 80, loss = 0.0589 --- Epoch 130 / 100000 Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0589 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0205 --- Epoch 131 / 100000 Iteration 0, loss = 0.0239 Iteration 20, loss = 0.0223 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0380 --- Epoch 132 / 100000 Iteration 0, loss = 0.0330 Iteration 20, loss = 0.0370 Iteration 40, loss = 0.0430 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0126 --- Epoch 133 / 100000 Iteration 0, loss = 0.0315 Iteration 20, loss = 0.0293 Iteration 40, loss = 0.0286 Iteration 60, loss = 0.0230 Iteration 80, loss = 0.0348 --- Epoch 134 / 100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0235 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0290 Iteration 80, loss = 0.0159 --- Epoch 135 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0209 Iteration 60, loss = 0.0378 Iteration 80, loss = 0.0283 --- Epoch 136 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0377 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0152 --- Epoch 137 / 100000 Iteration 0, loss = 0.0711 Iteration 20, 
loss = 0.0292 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0358 Iteration 80, loss = 0.0465 --- Epoch 138 / 100000 Iteration 0, loss = 0.0535 Iteration 20, loss = 0.0427 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0179 --- Epoch 139 / 100000 Iteration 0, loss = 0.0176 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0305 Iteration 60, loss = 0.0286 Iteration 80, loss = 0.0193 --- Epoch 140 / 100000 Iteration 0, loss = 0.0190 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0369 Iteration 60, loss = 0.0240 Iteration 80, loss = 0.0216 --- Epoch 141 / 100000 Iteration 0, loss = 0.0176 Iteration 20, loss = 0.0361 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0339 Iteration 80, loss = 0.0157 --- Epoch 142 / 100000 Iteration 0, loss = 0.0195 Iteration 20, loss = 0.0318 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0256 Iteration 80, loss = 0.0201 --- Epoch 143 / 100000 Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0409 Iteration 40, loss = 0.0244 Iteration 60, loss = 0.0379 Iteration 80, loss = 0.0258 --- Epoch 144 / 100000 Iteration 0, loss = 0.0242 Iteration 20, loss = 0.0339 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0360 Iteration 80, loss = 0.0182 --- Epoch 145 / 100000 Iteration 0, loss = 0.0327 Iteration 20, loss = 0.0442 Iteration 40, loss = 0.0251 Iteration 60, loss = 0.0159 Iteration 80, loss = 0.0146 --- Epoch 146 / 100000 Iteration 0, loss = 0.0197 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0209 Iteration 60, loss = 0.0410 Iteration 80, loss = 0.0283 --- Epoch 147 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0259 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0327 Iteration 80, loss = 0.0260 --- Epoch 148 / 100000 Iteration 0, loss = 0.0213 Iteration 20, loss = 0.0193 Iteration 40, loss = 0.0207 Iteration 60, loss = 0.0167 Iteration 80, loss = 0.0350 --- Epoch 149 / 100000 Iteration 0, loss = 0.0252 Iteration 20, loss = 0.0203 Iteration 40, loss = 0.0224 Iteration 60, 
loss = 0.0335 Iteration 80, loss = 0.0256 --- Epoch 150 / 100000 Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0258 Iteration 80, loss = 0.0143 --- Epoch 151 / 100000 Iteration 0, loss = 0.0313 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0183 Iteration 80, loss = 0.0503 --- Epoch 152 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0259 Iteration 60, loss = 0.0301 Iteration 80, loss = 0.0156 --- Epoch 153 / 100000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0378 Iteration 40, loss = 0.0231 Iteration 60, loss = 0.0167 Iteration 80, loss = 0.0164 --- Epoch 154 / 100000 Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0229 Iteration 40, loss = 0.0284 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0207 --- Epoch 155 / 100000 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0190 Iteration 80, loss = 0.0225 --- Epoch 156 / 100000 Iteration 0, loss = 0.0281 Iteration 20, loss = 0.0389 Iteration 40, loss = 0.0348 Iteration 60, loss = 0.0414 Iteration 80, loss = 0.0276 --- Epoch 157 / 100000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0173 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0467 Iteration 80, loss = 0.0183 --- Epoch 158 / 100000 Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0233 Iteration 40, loss = 0.0283 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0135 --- Epoch 159 / 100000 Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0260 Iteration 40, loss = 0.0169 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0151 --- Epoch 160 / 100000 Iteration 0, loss = 0.0237 Iteration 20, loss = 0.0275 Iteration 40, loss = 0.0302 Iteration 60, loss = 0.0349 Iteration 80, loss = 0.0142 --- Epoch 161 / 100000 Iteration 0, loss = 0.0255 Iteration 20, loss = 0.0161 Iteration 40, loss = 0.0219 Iteration 60, loss = 0.0207 Iteration 80, loss = 0.0125 --- Epoch 162 
/ 100000 Iteration 0, loss = 0.0291 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0194 Iteration 80, loss = 0.0212 --- Epoch 163 / 100000 Iteration 0, loss = 0.0214 Iteration 20, loss = 0.0199 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0470 Iteration 80, loss = 0.0134 --- Epoch 164 / 100000 Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0327 Iteration 40, loss = 0.0256 Iteration 60, loss = 0.0259 Iteration 80, loss = 0.0168 --- Epoch 165 / 100000 Iteration 0, loss = 0.0244 Iteration 20, loss = 0.0168 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0267 Iteration 80, loss = 0.0186 --- Epoch 166 / 100000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0265 --- Epoch 167 / 100000 Iteration 0, loss = 0.0160 Iteration 20, loss = 0.0290 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0306 Iteration 80, loss = 0.0160 --- Epoch 168 / 100000 Iteration 0, loss = 0.0293 Iteration 20, loss = 0.0182 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0238 Iteration 80, loss = 0.0223 --- Epoch 169 / 100000 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0431 Iteration 80, loss = 0.0467 --- Epoch 170 / 100000 Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0287 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0161 --- Epoch 171 / 100000 Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0269 Iteration 80, loss = 0.0226 --- Epoch 172 / 100000 Iteration 0, loss = 0.0261 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0312 Iteration 60, loss = 0.0482 Iteration 80, loss = 0.0632 --- Epoch 173 / 100000 Iteration 0, loss = 0.0403 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0252 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0252 --- Epoch 174 / 100000 Iteration 0, loss = 0.0284 Iteration 20, loss 
= 0.0179 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0335 --- Epoch 175 / 100000 Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0218 Iteration 60, loss = 0.0346 Iteration 80, loss = 0.0165 --- Epoch 176 / 100000 Iteration 0, loss = 0.0185 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0179 Iteration 60, loss = 0.0312 Iteration 80, loss = 0.0155 --- Epoch 177 / 100000 Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0196 Iteration 60, loss = 0.0248 Iteration 80, loss = 0.0158 --- Epoch 178 / 100000 Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0263 Iteration 40, loss = 0.0349 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0208 --- Epoch 179 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0179 Iteration 40, loss = 0.0236 Iteration 60, loss = 0.0234 Iteration 80, loss = 0.0188 --- Epoch 180 / 100000 Iteration 0, loss = 0.0235 Iteration 20, loss = 0.0297 Iteration 40, loss = 0.0235 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0218 --- Epoch 181 / 100000 Iteration 0, loss = 0.0217 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0214 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0209 --- Epoch 182 / 100000 Iteration 0, loss = 0.0296 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0268 Iteration 60, loss = 0.0225 Iteration 80, loss = 0.0103 --- Epoch 183 / 100000 Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0352 Iteration 60, loss = 0.0296 Iteration 80, loss = 0.0224 --- Epoch 184 / 100000 Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0826 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0198 --- Epoch 185 / 100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0367 Iteration 40, loss = 0.0235 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0133 --- Epoch 186 / 100000 Iteration 0, loss = 0.0261 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0122 Iteration 60, loss 
= 0.0138 Iteration 80, loss = 0.0110 --- Epoch 187 / 100000 Iteration 0, loss = 0.0175 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0222 Iteration 60, loss = 0.0387 Iteration 80, loss = 0.0152 --- Epoch 188 / 100000 Iteration 0, loss = 0.0231 Iteration 20, loss = 0.0755 Iteration 40, loss = 0.0253 Iteration 60, loss = 0.0237 Iteration 80, loss = 0.0130 --- Epoch 189 / 100000 Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0467 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0249 Iteration 80, loss = 0.0188 --- Epoch 190 / 100000 Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0310 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0522 Iteration 80, loss = 0.0157 --- Epoch 191 / 100000 Iteration 0, loss = 0.0336 Iteration 20, loss = 0.0335 Iteration 40, loss = 0.0220 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0178 --- Epoch 192 / 100000 Iteration 0, loss = 0.0499 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0158 Iteration 80, loss = 0.0305 --- Epoch 193 / 100000 Iteration 0, loss = 0.0386 Iteration 20, loss = 0.0303 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0277 Iteration 80, loss = 0.0304 --- Epoch 194 / 100000 Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0233 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0294 Iteration 80, loss = 0.0170 --- Epoch 195 / 100000 Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0257 Iteration 40, loss = 0.0178 Iteration 60, loss = 0.0227 Iteration 80, loss = 0.0276 --- Epoch 196 / 100000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0383 Iteration 80, loss = 0.0128 --- Epoch 197 / 100000 Iteration 0, loss = 0.0518 Iteration 20, loss = 0.0432 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0423 Iteration 80, loss = 0.0114 --- Epoch 198 / 100000 Iteration 0, loss = 0.0193 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0305 Iteration 80, loss = 0.0213 --- Epoch 199 / 
100000 Iteration 0, loss = 0.0391 Iteration 20, loss = 0.0506 Iteration 40, loss = 0.0383 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0083 --- Epoch 200 / 100000 Iteration 0, loss = 0.0233 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0442 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0104 --- Epoch 201 / 100000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0263 --- Epoch 202 / 100000 Iteration 0, loss = 0.0252 Iteration 20, loss = 0.0315 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0218 Iteration 80, loss = 0.0331 --- Epoch 203 / 100000 Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0215 Iteration 80, loss = 0.0352 --- Epoch 204 / 100000 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0227 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0576 --- Epoch 205 / 100000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0390 Iteration 40, loss = 0.0197 Iteration 60, loss = 0.0272 Iteration 80, loss = 0.0527 --- Epoch 206 / 100000 Iteration 0, loss = 0.0151 Iteration 20, loss = 0.0332 Iteration 40, loss = 0.0161 Iteration 60, loss = 0.0375 Iteration 80, loss = 0.0193 --- Epoch 207 / 100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0264 Iteration 40, loss = 0.0384 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0113 --- Epoch 208 / 100000 Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0225 Iteration 60, loss = 0.0305 Iteration 80, loss = 0.0426 --- Epoch 209 / 100000 Iteration 0, loss = 0.0201 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0535 --- Epoch 210 / 100000 Iteration 0, loss = 0.0336 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0187 --- Epoch 211 / 100000 Iteration 0, loss = 0.0138 Iteration 20, loss = 
0.0121 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0387 Iteration 80, loss = 0.0146 --- Epoch 212 / 100000 Iteration 0, loss = 0.0426 Iteration 20, loss = 0.0163 Iteration 40, loss = 0.0208 Iteration 60, loss = 0.0231 Iteration 80, loss = 0.0159 --- Epoch 213 / 100000 Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0197 Iteration 40, loss = 0.0186 Iteration 60, loss = 0.0188 Iteration 80, loss = 0.0134 --- Epoch 214 / 100000 Iteration 0, loss = 0.0200 Iteration 20, loss = 0.0241 Iteration 40, loss = 0.0481 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0159 --- Epoch 215 / 100000 Iteration 0, loss = 0.0290 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0167 Iteration 80, loss = 0.0195 --- Epoch 216 / 100000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0301 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0271 --- Epoch 217 / 100000 Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0391 Iteration 40, loss = 0.0169 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0152 --- Epoch 218 / 100000 Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0317 Iteration 80, loss = 0.0127 --- Epoch 219 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0240 Iteration 40, loss = 0.0303 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0240 --- Epoch 220 / 100000 Iteration 0, loss = 0.0267 Iteration 20, loss = 0.0303 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0214 Iteration 80, loss = 0.0188 --- Epoch 221 / 100000 Iteration 0, loss = 0.0349 Iteration 20, loss = 0.0213 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0244 --- Epoch 222 / 100000 Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0324 Iteration 60, loss = 0.0273 Iteration 80, loss = 0.0412 --- Epoch 223 / 100000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0443 Iteration 40, loss = 0.0175 Iteration 60, loss = 
0.0237 Iteration 80, loss = 0.0125 --- Epoch 224 / 100000 Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0248 --- Epoch 225 / 100000 Iteration 0, loss = 0.0357 Iteration 20, loss = 0.0328 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0222 --- Epoch 226 / 100000 Iteration 0, loss = 0.0186 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0377 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0282 --- Epoch 227 / 100000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0350 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0222 --- Epoch 228 / 100000 Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0192 Iteration 40, loss = 0.0261 Iteration 60, loss = 0.0427 Iteration 80, loss = 0.0161 --- Epoch 229 / 100000 Iteration 0, loss = 0.0184 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0212 Iteration 80, loss = 0.0161 --- Epoch 230 / 100000 Iteration 0, loss = 0.0542 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0132 --- Epoch 231 / 100000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0155 --- Epoch 232 / 100000 Iteration 0, loss = 0.0279 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0260 Iteration 80, loss = 0.0181 --- Epoch 233 / 100000 Iteration 0, loss = 0.0265 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0249 Iteration 80, loss = 0.0182 --- Epoch 234 / 100000 Iteration 0, loss = 0.0325 Iteration 20, loss = 0.0221 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0281 --- Epoch 235 / 100000 Iteration 0, loss = 0.0190 Iteration 20, loss = 0.0462 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0188 --- Epoch 236 / 
100000 Iteration 0, loss = 0.0195 Iteration 20, loss = 0.0261 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0319 --- Epoch 237 / 100000 Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0188 Iteration 40, loss = 0.0285 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0250 --- Epoch 238 / 100000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0082 --- Epoch 239 / 100000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0241 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0236 Iteration 80, loss = 0.0126 --- Epoch 240 / 100000 Iteration 0, loss = 0.0236 Iteration 20, loss = 0.0275 Iteration 40, loss = 0.0608 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0137 --- Epoch 241 / 100000 Iteration 0, loss = 0.0311 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0411 --- Epoch 242 / 100000 Iteration 0, loss = 0.0228 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0445 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0320 --- Epoch 243 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0199 Iteration 40, loss = 0.0151 Iteration 60, loss = 0.0260 Iteration 80, loss = 0.0122 --- Epoch 244 / 100000 Iteration 0, loss = 0.0227 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0477 Iteration 80, loss = 0.0309 --- Epoch 245 / 100000 Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0693 --- Epoch 246 / 100000 Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0241 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0239 --- Epoch 247 / 100000 Iteration 0, loss = 0.0300 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0233 Iteration 60, loss = 0.0184 Iteration 80, loss = 0.0221 --- Epoch 248 / 100000 Iteration 0, loss = 0.0217 Iteration 20, loss = 
0.0191 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0199 --- Epoch 249 / 100000 Iteration 0, loss = 0.0491 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0238 Iteration 80, loss = 0.0150 --- Epoch 250 / 100000 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0223 Iteration 40, loss = 0.0218 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0136 --- Epoch 251 / 100000 Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0214 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0232 --- Epoch 252 / 100000 Iteration 0, loss = 0.0195 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0386 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0414 --- Epoch 253 / 100000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0299 Iteration 40, loss = 0.0285 Iteration 60, loss = 0.0370 Iteration 80, loss = 0.0100 --- Epoch 254 / 100000 Iteration 0, loss = 0.0438 Iteration 20, loss = 0.0639 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0116 --- Epoch 255 / 100000 Iteration 0, loss = 0.0239 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0084 --- Epoch 256 / 100000 Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0268 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0278 Iteration 80, loss = 0.0157 --- Epoch 257 / 100000 Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0385 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0159 Iteration 80, loss = 0.0119 --- Epoch 258 / 100000 Iteration 0, loss = 0.0312 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0161 --- Epoch 259 / 100000 Iteration 0, loss = 0.0274 Iteration 20, loss = 0.0339 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0158 --- Epoch 260 / 100000 Iteration 0, loss = 0.0286 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0125 Iteration 60, loss = 
0.0121 Iteration 80, loss = 0.0119 --- Epoch 261 / 100000 Iteration 0, loss = 0.0310 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0286 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0143 --- Epoch 262 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0240 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0171 --- Epoch 263 / 100000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0256 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0127 --- Epoch 264 / 100000 Iteration 0, loss = 0.0533 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0232 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0112 --- Epoch 265 / 100000 Iteration 0, loss = 0.0259 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0311 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0138 --- Epoch 266 / 100000 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0183 --- Epoch 267 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0233 Iteration 40, loss = 0.0335 Iteration 60, loss = 0.0284 Iteration 80, loss = 0.0136 --- Epoch 268 / 100000 Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0384 Iteration 60, loss = 0.0290 Iteration 80, loss = 0.0230 --- Epoch 269 / 100000 Iteration 0, loss = 0.0184 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0301 Iteration 80, loss = 0.0269 --- Epoch 270 / 100000 Iteration 0, loss = 0.0226 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0163 Iteration 80, loss = 0.0176 --- Epoch 271 / 100000 Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0206 Iteration 40, loss = 0.0270 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0294 --- Epoch 272 / 100000 Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0216 Iteration 80, loss = 0.0146 --- Epoch 273 / 
100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0207 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0210 --- Epoch 274 / 100000 Iteration 0, loss = 0.0212 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0230 Iteration 60, loss = 0.0398 Iteration 80, loss = 0.0107 --- Epoch 275 / 100000 Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0151 Iteration 60, loss = 0.0244 Iteration 80, loss = 0.0266 --- Epoch 276 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0137 --- Epoch 277 / 100000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0293 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0194 --- Epoch 278 / 100000 Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0328 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0208 Iteration 80, loss = 0.0216 --- Epoch 279 / 100000 Iteration 0, loss = 0.0325 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0298 Iteration 60, loss = 0.0332 Iteration 80, loss = 0.0144 --- Epoch 280 / 100000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0280 Iteration 40, loss = 0.0196 Iteration 60, loss = 0.0230 Iteration 80, loss = 0.0292 --- Epoch 281 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0232 Iteration 60, loss = 0.0144 Iteration 80, loss = 0.0171 --- Epoch 282 / 100000 Iteration 0, loss = 0.0265 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0182 Iteration 60, loss = 0.0159 Iteration 80, loss = 0.0220 --- Epoch 283 / 100000 Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0173 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0165 --- Epoch 284 / 100000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0258 --- Epoch 285 / 100000 Iteration 0, loss = 0.0221 Iteration 20, loss = 
0.0200 Iteration 40, loss = 0.0208 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0150 --- Epoch 286 / 100000 Iteration 0, loss = 0.0276 Iteration 20, loss = 0.0157 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0335 --- Epoch 287 / 100000 Iteration 0, loss = 0.0213 Iteration 20, loss = 0.0296 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0188 Iteration 80, loss = 0.0124 --- Epoch 288 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0388 Iteration 80, loss = 0.0169 --- Epoch 289 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0253 Iteration 40, loss = 0.0169 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0134 --- Epoch 290 / 100000 Iteration 0, loss = 0.0276 Iteration 20, loss = 0.0216 Iteration 40, loss = 0.0249 Iteration 60, loss = 0.0217 Iteration 80, loss = 0.0330 --- Epoch 291 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0202 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0163 --- Epoch 292 / 100000 Iteration 0, loss = 0.0615 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0384 Iteration 80, loss = 0.0094 --- Epoch 293 / 100000 Iteration 0, loss = 0.0187 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0463 Iteration 80, loss = 0.0202 --- Epoch 294 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0170 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0103 --- Epoch 295 / 100000 Iteration 0, loss = 0.0242 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0412 Iteration 80, loss = 0.0174 --- Epoch 296 / 100000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0282 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0192 --- Epoch 297 / 100000 Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0157 Iteration 40, loss = 0.0294 Iteration 60, loss = 
0.0173 Iteration 80, loss = 0.0162 --- Epoch 298 / 100000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0142 --- Epoch 299 / 100000 Iteration 0, loss = 0.0219 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0215 Iteration 60, loss = 0.0225 Iteration 80, loss = 0.0121 --- Epoch 300 / 100000 Iteration 0, loss = 0.0449 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0593 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0200 --- Epoch 301 / 100000 Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0166 --- Epoch 302 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0218 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0130 --- Epoch 303 / 100000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0190 --- Epoch 304 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0311 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0201 --- Epoch 305 / 100000 Iteration 0, loss = 0.0597 Iteration 20, loss = 0.0251 Iteration 40, loss = 0.0241 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0152 --- Epoch 306 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0319 Iteration 80, loss = 0.0282 --- Epoch 307 / 100000 Iteration 0, loss = 0.0154 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0342 Iteration 80, loss = 0.0150 --- Epoch 308 / 100000 Iteration 0, loss = 0.0174 Iteration 20, loss = 0.0217 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0193 --- Epoch 309 / 100000 Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0317 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0251 --- Epoch 310 / 
100000 Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0188 Iteration 80, loss = 0.0189 --- Epoch 311 / 100000 Iteration 0, loss = 0.0185 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0244 --- Epoch 312 / 100000 Iteration 0, loss = 0.0299 Iteration 20, loss = 0.0275 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0127 --- Epoch 313 / 100000 Iteration 0, loss = 0.0338 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0288 Iteration 80, loss = 0.0178 --- Epoch 314 / 100000 Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0223 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0123 --- Epoch 315 / 100000 Iteration 0, loss = 0.0757 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0211 Iteration 80, loss = 0.0231 --- Epoch 316 / 100000 Iteration 0, loss = 0.0224 Iteration 20, loss = 0.0346 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0098 --- Epoch 317 / 100000 Iteration 0, loss = 0.0225 Iteration 20, loss = 0.0290 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0209 --- Epoch 318 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0329 Iteration 40, loss = 0.0322 Iteration 60, loss = 0.0344 Iteration 80, loss = 0.0181 --- Epoch 319 / 100000 Iteration 0, loss = 0.0254 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0188 Iteration 80, loss = 0.0283 --- Epoch 320 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0248 --- Epoch 321 / 100000 Iteration 0, loss = 0.0214 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0312 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0154 --- Epoch 322 / 100000 Iteration 0, loss = 0.0233 Iteration 20, loss = 
0.0201 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0204 Iteration 80, loss = 0.0228 --- Epoch 323 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0226 Iteration 80, loss = 0.0230 --- Epoch 324 / 100000 Iteration 0, loss = 0.0394 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0300 --- Epoch 325 / 100000 Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0329 Iteration 80, loss = 0.0155 --- Epoch 326 / 100000 Iteration 0, loss = 0.0243 Iteration 20, loss = 0.0350 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0106 --- Epoch 327 / 100000 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0670 --- Epoch 328 / 100000 Iteration 0, loss = 0.0449 Iteration 20, loss = 0.0281 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0258 Iteration 80, loss = 0.0148 --- Epoch 329 / 100000 Iteration 0, loss = 0.0136 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0214 --- Epoch 330 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0198 --- Epoch 331 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0306 Iteration 40, loss = 0.0233 Iteration 60, loss = 0.0298 Iteration 80, loss = 0.0296 --- Epoch 332 / 100000 Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0149 --- Epoch 333 / 100000 Iteration 0, loss = 0.0316 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0276 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0187 --- Epoch 334 / 100000 Iteration 0, loss = 0.0274 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0137 Iteration 60, loss = 
0.0238 Iteration 80, loss = 0.0116 --- Epoch 335 / 100000 Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0198 --- Epoch 336 / 100000 Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0229 Iteration 80, loss = 0.0162 --- Epoch 337 / 100000 Iteration 0, loss = 0.0214 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0152 --- Epoch 338 / 100000 Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0312 Iteration 40, loss = 0.0263 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0169 --- Epoch 339 / 100000 Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0250 Iteration 80, loss = 0.0427 --- Epoch 340 / 100000 Iteration 0, loss = 0.0238 Iteration 20, loss = 0.0278 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0282 --- Epoch 341 / 100000 Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0532 Iteration 40, loss = 0.0324 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0313 --- Epoch 342 / 100000 Iteration 0, loss = 0.0183 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0328 --- Epoch 343 / 100000 Iteration 0, loss = 0.0270 Iteration 20, loss = 0.0157 Iteration 40, loss = 0.0209 Iteration 60, loss = 0.0108 Iteration 80, loss = 0.0212 --- Epoch 344 / 100000 Iteration 0, loss = 0.0232 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0217 --- Epoch 345 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0461 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0125 --- Epoch 346 / 100000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0177 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0182 --- Epoch 347 / 
100000 Iteration 0, loss = 0.0215 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0251 --- Epoch 348 / 100000 Iteration 0, loss = 0.0226 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0199 Iteration 80, loss = 0.0110 --- Epoch 349 / 100000 Iteration 0, loss = 0.0167 Iteration 20, loss = 0.0257 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0100 --- Epoch 350 / 100000 Iteration 0, loss = 0.0218 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0247 Iteration 80, loss = 0.0261 --- Epoch 351 / 100000 Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0323 Iteration 80, loss = 0.0109 --- Epoch 352 / 100000 Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0263 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0211 Iteration 80, loss = 0.0138 --- Epoch 353 / 100000 Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0220 Iteration 40, loss = 0.0812 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0162 --- Epoch 354 / 100000 Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0168 Iteration 40, loss = 0.0253 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0247 --- Epoch 355 / 100000 Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0094 --- Epoch 356 / 100000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0412 --- Epoch 357 / 100000 Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0294 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0162 --- Epoch 358 / 100000 Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0270 Iteration 40, loss = 0.0254 Iteration 60, loss = 0.0258 Iteration 80, loss = 0.0110 --- Epoch 359 / 100000 Iteration 0, loss = 0.0268 Iteration 20, loss = 
0.0112 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0186 Iteration 80, loss = 0.0188 --- Epoch 360 / 100000 Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0179 Iteration 60, loss = 0.0269 Iteration 80, loss = 0.0104 --- Epoch 361 / 100000 Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0222 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0343 Iteration 80, loss = 0.0260 --- Epoch 362 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0168 --- Epoch 363 / 100000 Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0528 Iteration 40, loss = 0.0136 Iteration 60, loss = 0.0167 Iteration 80, loss = 0.0197 --- Epoch 364 / 100000 Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0522 Iteration 60, loss = 0.0343 Iteration 80, loss = 0.0220 --- Epoch 365 / 100000 Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0439 Iteration 60, loss = 0.0279 Iteration 80, loss = 0.0201 --- Epoch 366 / 100000 Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0164 --- Epoch 367 / 100000 Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0179 Iteration 60, loss = 0.0187 Iteration 80, loss = 0.0174 --- Epoch 368 / 100000 Iteration 0, loss = 0.0160 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0403 Iteration 80, loss = 0.0219 --- Epoch 369 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0191 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0286 Iteration 80, loss = 0.0183 --- Epoch 370 / 100000 Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0247 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0081 --- Epoch 371 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0164 Iteration 60, loss = 
0.0180 Iteration 80, loss = 0.0092 --- Epoch 372 / 100000 Iteration 0, loss = 0.0154 Iteration 20, loss = 0.0193 Iteration 40, loss = 0.0262 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0140 --- Epoch 373 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0184 --- Epoch 374 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0218 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0278 Iteration 80, loss = 0.0392 --- Epoch 375 / 100000 Iteration 0, loss = 0.0318 Iteration 20, loss = 0.0263 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0160 --- Epoch 376 / 100000 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0238 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0219 --- Epoch 377 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0378 Iteration 80, loss = 0.0192 --- Epoch 378 / 100000 Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0328 Iteration 60, loss = 0.0279 Iteration 80, loss = 0.0270 --- Epoch 379 / 100000 Iteration 0, loss = 0.0270 Iteration 20, loss = 0.0253 Iteration 40, loss = 0.0251 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0186 --- Epoch 380 / 100000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0287 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0267 --- Epoch 381 / 100000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0253 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0153 --- Epoch 382 / 100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0198 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0128 --- Epoch 383 / 100000 Iteration 0, loss = 0.0235 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0196 Iteration 60, loss = 0.0154 Iteration 80, loss = 0.0117 --- Epoch 384 / 
100000 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0244 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0164 --- Epoch 385 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0202 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0160 --- Epoch 386 / 100000 Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0122 --- Epoch 387 / 100000 Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0224 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0359 --- Epoch 388 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0225 Iteration 80, loss = 0.0276 --- Epoch 389 / 100000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0151 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0226 --- Epoch 390 / 100000 Iteration 0, loss = 0.0160 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0199 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0223 --- Epoch 391 / 100000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0229 Iteration 80, loss = 0.0173 --- Epoch 392 / 100000 Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0179 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0269 --- Epoch 393 / 100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0275 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0179 --- Epoch 394 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0173 Iteration 60, loss = 0.0278 Iteration 80, loss = 0.0695 --- Epoch 395 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0184 Iteration 80, loss = 0.0147 --- Epoch 396 / 100000 Iteration 0, loss = 0.0136 Iteration 20, loss = 
0.0214 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0153 --- Epoch 397 / 100000 Iteration 0, loss = 0.0355 Iteration 20, loss = 0.0160 Iteration 40, loss = 0.0347 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0088 --- Epoch 398 / 100000 Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0197 Iteration 60, loss = 0.0218 Iteration 80, loss = 0.0249 --- Epoch 399 / 100000 Iteration 0, loss = 0.0217 Iteration 20, loss = 0.0366 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0176 Iteration 80, loss = 0.0122 --- Epoch 400 / 100000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0167 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0291 Iteration 80, loss = 0.0145 --- Epoch 401 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0200 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0305 --- Epoch 402 / 100000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0215 Iteration 40, loss = 0.0242 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0164 --- Epoch 403 / 100000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0230 Iteration 40, loss = 0.0242 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0315 --- Epoch 404 / 100000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0122 --- Epoch 405 / 100000 Iteration 0, loss = 0.0269 Iteration 20, loss = 0.0252 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0179 --- Epoch 406 / 100000 Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0418 Iteration 40, loss = 0.0218 Iteration 60, loss = 0.0163 Iteration 80, loss = 0.0153 --- Epoch 407 / 100000 Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0298 Iteration 60, loss = 0.0225 Iteration 80, loss = 0.0206 --- Epoch 408 / 100000 Iteration 0, loss = 0.0160 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0214 Iteration 60, loss = 
0.0237 Iteration 80, loss = 0.0137 --- Epoch 409 / 100000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0401 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0118 --- Epoch 410 / 100000 Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0385 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0164 --- Epoch 411 / 100000 Iteration 0, loss = 0.0293 Iteration 20, loss = 0.0213 Iteration 40, loss = 0.0363 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0143 --- Epoch 412 / 100000 Iteration 0, loss = 0.0225 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0118 --- Epoch 413 / 100000 Iteration 0, loss = 0.0401 Iteration 20, loss = 0.0250 Iteration 40, loss = 0.0173 Iteration 60, loss = 0.0154 Iteration 80, loss = 0.0183 --- Epoch 414 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0103 --- Epoch 415 / 100000 Iteration 0, loss = 0.0212 Iteration 20, loss = 0.0343 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0183 Iteration 80, loss = 0.0162 --- Epoch 416 / 100000 Iteration 0, loss = 0.0136 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0094 --- Epoch 417 / 100000 Iteration 0, loss = 0.0154 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0117 --- Epoch 418 / 100000 Iteration 0, loss = 0.0136 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0423 --- Epoch 419 / 100000 Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0161 Iteration 60, loss = 0.0350 Iteration 80, loss = 0.0222 --- Epoch 420 / 100000 Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0157 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0293 Iteration 80, loss = 0.0338 --- Epoch 421 / 
100000 Iteration 0, loss = 0.0224 Iteration 20, loss = 0.0416 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0551 --- Epoch 422 / 100000 Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0160 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0333 Iteration 80, loss = 0.0333 --- Epoch 423 / 100000 Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0236 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0137 --- Epoch 424 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0253 Iteration 60, loss = 0.0187 Iteration 80, loss = 0.0219 --- Epoch 425 / 100000 Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0491 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0156 --- Epoch 426 / 100000 Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0567 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0102 --- Epoch 427 / 100000 Iteration 0, loss = 0.0240 Iteration 20, loss = 0.0322 Iteration 40, loss = 0.0495 Iteration 60, loss = 0.0305 Iteration 80, loss = 0.0118 --- Epoch 428 / 100000 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0138 --- Epoch 429 / 100000 Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0160 Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0098 --- Epoch 430 / 100000 Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0219 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0083 --- Epoch 431 / 100000 Iteration 0, loss = 0.0186 Iteration 20, loss = 0.0258 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0209 Iteration 80, loss = 0.0248 --- Epoch 432 / 100000 Iteration 0, loss = 0.0209 Iteration 20, loss = 0.0305 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0188 Iteration 80, loss = 0.0102 --- Epoch 433 / 100000 Iteration 0, loss = 0.0129 Iteration 20, loss = 
0.0157 Iteration 40, loss = 0.0215 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0255 --- Epoch 434 / 100000 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0240 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0209 Iteration 80, loss = 0.0151 --- Epoch 435 / 100000 Iteration 0, loss = 0.0213 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0205 --- Epoch 436 / 100000 Iteration 0, loss = 0.0255 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0196 Iteration 80, loss = 0.0290 --- Epoch 437 / 100000 Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0097 --- Epoch 438 / 100000 Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0167 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0320 Iteration 80, loss = 0.0286 --- Epoch 439 / 100000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0263 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0160 --- Epoch 440 / 100000 Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0277 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0312 --- Epoch 441 / 100000 Iteration 0, loss = 0.0164 Iteration 20, loss = 0.0183 Iteration 40, loss = 0.0161 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0232 --- Epoch 442 / 100000 Iteration 0, loss = 0.0209 Iteration 20, loss = 0.0226 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0367 Iteration 80, loss = 0.0121 --- Epoch 443 / 100000 Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0180 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0252 --- Epoch 444 / 100000 Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0177 Iteration 60, loss = 0.0256 Iteration 80, loss = 0.0089 --- Epoch 445 / 100000 Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0182 Iteration 40, loss = 0.0125 Iteration 60, loss = 
0.0144 Iteration 80, loss = 0.0206 --- Epoch 446 / 100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0235 Iteration 80, loss = 0.0122 --- Epoch 447 / 100000 Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0683 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0289 --- Epoch 448 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0248 Iteration 80, loss = 0.0295 --- Epoch 449 / 100000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0296 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0166 --- Epoch 450 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0092 --- Epoch 451 / 100000 Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0163 Iteration 80, loss = 0.0466 --- Epoch 452 / 100000 Iteration 0, loss = 0.0236 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0392 Iteration 80, loss = 0.0374 --- Epoch 453 / 100000 Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0364 --- Epoch 454 / 100000 Iteration 0, loss = 0.0177 Iteration 20, loss = 0.0160 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0340 Iteration 80, loss = 0.0151 --- Epoch 455 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0370 Iteration 80, loss = 0.0154 --- Epoch 456 / 100000 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0272 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0141 --- Epoch 457 / 100000 Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0315 --- Epoch 458 / 
100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0252 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0102 --- Epoch 459 / 100000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0233 --- Epoch 460 / 100000 Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0226 --- Epoch 461 / 100000 Iteration 0, loss = 0.0298 Iteration 20, loss = 0.0283 Iteration 40, loss = 0.0169 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0165 --- Epoch 462 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0234 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0141 --- Epoch 463 / 100000 Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0212 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0239 --- Epoch 464 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0099 --- Epoch 465 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0223 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0221 --- Epoch 466 / 100000 Iteration 0, loss = 0.0223 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0260 --- Epoch 467 / 100000 Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0112 --- Epoch 468 / 100000 Iteration 0, loss = 0.0300 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0227 Iteration 80, loss = 0.0168 --- Epoch 469 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0179 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0116 --- Epoch 470 / 100000 Iteration 0, loss = 0.0193 Iteration 20, loss = 
0.0120 Iteration 40, loss = 0.0270 Iteration 60, loss = 0.0225 Iteration 80, loss = 0.0073 --- Epoch 471 / 100000 Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0138 --- Epoch 472 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0189 --- Epoch 473 / 100000 Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0256 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0167 --- Epoch 474 / 100000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0302 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0090 --- Epoch 475 / 100000 Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0269 Iteration 60, loss = 0.0203 Iteration 80, loss = 0.0296 --- Epoch 476 / 100000 Iteration 0, loss = 0.0193 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0235 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0119 --- Epoch 477 / 100000 Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0138 --- Epoch 478 / 100000 Iteration 0, loss = 0.0240 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0255 --- Epoch 479 / 100000 Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0184 --- Epoch 480 / 100000 Iteration 0, loss = 0.0378 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0140 --- Epoch 481 / 100000 Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0265 Iteration 40, loss = 0.0238 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0229 --- Epoch 482 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0198 Iteration 40, loss = 0.0273 Iteration 60, loss = 
0.0189 Iteration 80, loss = 0.0219 --- Epoch 483 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0102 --- Epoch 484 / 100000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0344 --- Epoch 485 / 100000 Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0240 Iteration 60, loss = 0.0281 Iteration 80, loss = 0.0184 --- Epoch 486 / 100000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0278 Iteration 80, loss = 0.0152 --- Epoch 487 / 100000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0159 Iteration 80, loss = 0.0219 --- Epoch 488 / 100000 Iteration 0, loss = 0.0193 Iteration 20, loss = 0.0452 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0186 --- Epoch 489 / 100000 Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0151 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0140 --- Epoch 490 / 100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0292 Iteration 40, loss = 0.0241 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0104 --- Epoch 491 / 100000 Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0315 Iteration 80, loss = 0.0228 --- Epoch 492 / 100000 Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0168 --- Epoch 493 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0403 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0131 --- Epoch 494 / 100000 Iteration 0, loss = 0.0318 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0250 Iteration 80, loss = 0.0122 --- Epoch 495 / 
100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0246 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0272 --- Epoch 496 / 100000 Iteration 0, loss = 0.0237 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0198 --- Epoch 497 / 100000 Iteration 0, loss = 0.0164 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0397 --- Epoch 498 / 100000 Iteration 0, loss = 0.0227 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0153 --- Epoch 499 / 100000 Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0161 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0184 Iteration 80, loss = 0.0283 --- Epoch 500 / 100000 Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0285 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0166 --- Epoch 501 / 100000 Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0196 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0102 --- Epoch 502 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0506 --- Epoch 503 / 100000 Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0272 Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0079 --- Epoch 504 / 100000 Iteration 0, loss = 0.0388 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0137 Iteration 80, loss = 0.0264 --- Epoch 505 / 100000 Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0265 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0155 --- Epoch 506 / 100000 Iteration 0, loss = 0.0268 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0220 --- Epoch 507 / 100000 Iteration 0, loss = 0.0131 Iteration 20, loss = 
0.0129 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0200 Iteration 80, loss = 0.0459 --- Epoch 508 / 100000 Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0163 --- Epoch 509 / 100000 Iteration 0, loss = 0.0340 Iteration 20, loss = 0.0196 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0215 Iteration 80, loss = 0.0229 --- Epoch 510 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0223 --- Epoch 511 / 100000 Iteration 0, loss = 0.0473 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0227 Iteration 60, loss = 0.0334 Iteration 80, loss = 0.0215 --- Epoch 512 / 100000 Iteration 0, loss = 0.0200 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0189 Iteration 80, loss = 0.0278 --- Epoch 513 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0282 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0178 --- Epoch 514 / 100000 Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0243 Iteration 40, loss = 0.0345 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0137 --- Epoch 515 / 100000 Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0275 Iteration 80, loss = 0.0142 --- Epoch 516 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0236 Iteration 40, loss = 0.0245 Iteration 60, loss = 0.0229 Iteration 80, loss = 0.0159 --- Epoch 517 / 100000 Iteration 0, loss = 0.0164 Iteration 20, loss = 0.0178 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0253 Iteration 80, loss = 0.0140 --- Epoch 518 / 100000 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0191 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0144 --- Epoch 519 / 100000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0263 Iteration 40, loss = 0.0095 Iteration 60, loss = 
0.0182 Iteration 80, loss = 0.0117 --- Epoch 520 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0157 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0092 --- Epoch 521 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0189 --- Epoch 522 / 100000 Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0188 --- Epoch 523 / 100000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0222 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0186 --- Epoch 524 / 100000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0244 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0113 --- Epoch 525 / 100000 Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0167 Iteration 80, loss = 0.0272 --- Epoch 526 / 100000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0322 Iteration 80, loss = 0.0362 --- Epoch 527 / 100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0231 Iteration 80, loss = 0.0188 --- Epoch 528 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0202 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0189 Iteration 80, loss = 0.0338 --- Epoch 529 / 100000 Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0379 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0247 Iteration 80, loss = 0.0111 --- Epoch 530 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0160 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0151 --- Epoch 531 / 100000 Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0215 Iteration 80, loss = 0.0171 --- Epoch 532 / 
100000 Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0249 Iteration 40, loss = 0.0303 Iteration 60, loss = 0.0396 Iteration 80, loss = 0.0184 --- Epoch 533 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0088 --- Epoch 534 / 100000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0191 Iteration 40, loss = 0.0136 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0146 --- Epoch 535 / 100000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0321 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0336 --- Epoch 536 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0261 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0194 --- Epoch 537 / 100000 Iteration 0, loss = 0.0260 Iteration 20, loss = 0.0475 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0169 --- Epoch 538 / 100000 Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0246 Iteration 80, loss = 0.0264 --- Epoch 539 / 100000 Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0312 Iteration 40, loss = 0.0182 Iteration 60, loss = 0.0247 Iteration 80, loss = 0.0132 --- Epoch 540 / 100000 Iteration 0, loss = 0.0218 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0244 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0159 --- Epoch 541 / 100000 Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0211 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0190 Iteration 80, loss = 0.0075 --- Epoch 542 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0106 --- Epoch 543 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0119 --- Epoch 544 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 
0.0105 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0301 --- Epoch 545 / 100000 Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0299 Iteration 40, loss = 0.0226 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0071 --- Epoch 546 / 100000 Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0211 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0121 --- Epoch 547 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0283 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0231 Iteration 80, loss = 0.0141 --- Epoch 548 / 100000 Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0371 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0246 --- Epoch 549 / 100000 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0200 Iteration 80, loss = 0.0109 --- Epoch 550 / 100000 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0284 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0207 --- Epoch 551 / 100000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0109 --- Epoch 552 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0154 Iteration 80, loss = 0.0099 --- Epoch 553 / 100000 Iteration 0, loss = 0.0195 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0325 Iteration 60, loss = 0.0307 Iteration 80, loss = 0.0207 --- Epoch 554 / 100000 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0202 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0140 --- Epoch 555 / 100000 Iteration 0, loss = 0.0208 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0182 Iteration 60, loss = 0.0199 Iteration 80, loss = 0.0107 --- Epoch 556 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0213 Iteration 40, loss = 0.0277 Iteration 60, loss = 
0.0078 Iteration 80, loss = 0.0141 --- Epoch 557 / 100000 Iteration 0, loss = 0.0157 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0189 Iteration 80, loss = 0.0174 --- Epoch 558 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0182 --- Epoch 559 / 100000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0151 --- Epoch 560 / 100000 Iteration 0, loss = 0.0233 Iteration 20, loss = 0.0196 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0156 --- Epoch 561 / 100000 Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0399 Iteration 80, loss = 0.0123 --- Epoch 562 / 100000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0230 Iteration 40, loss = 0.0287 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0454 --- Epoch 563 / 100000 Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0136 --- Epoch 564 / 100000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0289 --- Epoch 565 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0263 --- Epoch 566 / 100000 Iteration 0, loss = 0.0368 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0080 --- Epoch 567 / 100000 Iteration 0, loss = 0.0160 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0394 --- Epoch 568 / 100000 Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0250 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0197 Iteration 80, loss = 0.0076 --- Epoch 569 / 
100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0160 Iteration 40, loss = 0.0182 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0118 --- Epoch 570 / 100000 Iteration 0, loss = 0.0190 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0196 Iteration 80, loss = 0.0079 --- Epoch 571 / 100000 Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0319 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0192 --- Epoch 572 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0089 --- Epoch 573 / 100000 Iteration 0, loss = 0.0232 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0161 --- Epoch 574 / 100000 Iteration 0, loss = 0.0235 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0331 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0272 --- Epoch 575 / 100000 Iteration 0, loss = 0.0201 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0118 --- Epoch 576 / 100000 Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0475 Iteration 40, loss = 0.0267 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0261 --- Epoch 577 / 100000 Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0160 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0120 --- Epoch 578 / 100000 Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0256 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0170 --- Epoch 579 / 100000 Iteration 0, loss = 0.0222 Iteration 20, loss = 0.0192 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0384 Iteration 80, loss = 0.0200 --- Epoch 580 / 100000 Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0187 --- Epoch 581 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 
0.0085 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0111 --- Epoch 582 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0131 --- Epoch 583 / 100000 Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0173 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0209 --- Epoch 584 / 100000 Iteration 0, loss = 0.0290 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0208 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0183 --- Epoch 585 / 100000 Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0275 Iteration 80, loss = 0.0269 --- Epoch 586 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0402 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0093 --- Epoch 587 / 100000 Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0220 --- Epoch 588 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0200 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0109 --- Epoch 589 / 100000 Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0350 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0262 --- Epoch 590 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0264 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0072 --- Epoch 591 / 100000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0141 --- Epoch 592 / 100000 Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0156 --- Epoch 593 / 100000 Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0169 Iteration 60, loss = 
0.0218 Iteration 80, loss = 0.0096 --- Epoch 594 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0148 --- Epoch 595 / 100000 Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0093 --- Epoch 596 / 100000 Iteration 0, loss = 0.0215 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0252 --- Epoch 597 / 100000 Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0447 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0214 --- Epoch 598 / 100000 Iteration 0, loss = 0.0257 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0096 --- Epoch 599 / 100000 Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0190 Iteration 80, loss = 0.0212 --- Epoch 600 / 100000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0286 Iteration 40, loss = 0.0294 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0211 --- Epoch 601 / 100000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0259 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0204 --- Epoch 602 / 100000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0209 --- Epoch 603 / 100000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0191 Iteration 80, loss = 0.0097 --- Epoch 604 / 100000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0287 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0137 --- Epoch 605 / 100000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0189 Iteration 80, loss = 0.0085 --- Epoch 606 / 
100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0192 --- Epoch 607 / 100000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0290 Iteration 80, loss = 0.0200 --- Epoch 608 / 100000 Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0108 --- Epoch 609 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0215 Iteration 40, loss = 0.0266 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0112 --- Epoch 610 / 100000 Iteration 0, loss = 0.0655 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0088 --- Epoch 611 / 100000 Iteration 0, loss = 0.0383 Iteration 20, loss = 0.0351 Iteration 40, loss = 0.0173 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0160 --- Epoch 612 / 100000 Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0119 --- Epoch 613 / 100000 Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0243 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0187 Iteration 80, loss = 0.0166 --- Epoch 614 / 100000 Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0215 Iteration 80, loss = 0.0118 --- Epoch 615 / 100000 Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0267 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0121 --- Epoch 616 / 100000 Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0180 --- Epoch 617 / 100000 Iteration 0, loss = 0.0276 Iteration 20, loss = 0.0178 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0121 --- Epoch 618 / 100000 Iteration 0, loss = 0.0182 Iteration 20, loss = 
0.0125 Iteration 40, loss = 0.0223 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0182 --- Epoch 619 / 100000 Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0225 --- Epoch 620 / 100000 Iteration 0, loss = 0.0151 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0473 Iteration 80, loss = 0.0171 --- Epoch 621 / 100000 Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0148 --- Epoch 622 / 100000 Iteration 0, loss = 0.0250 Iteration 20, loss = 0.0333 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0216 Iteration 80, loss = 0.0229 --- Epoch 623 / 100000 Iteration 0, loss = 0.0182 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0131 --- Epoch 624 / 100000 Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0475 Iteration 40, loss = 0.0222 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0141 --- Epoch 625 / 100000 Iteration 0, loss = 0.0322 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0143 --- Epoch 626 / 100000 Iteration 0, loss = 0.0273 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0152 --- Epoch 627 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0315 Iteration 80, loss = 0.0144 --- Epoch 628 / 100000 Iteration 0, loss = 0.0176 Iteration 20, loss = 0.0277 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0089 --- Epoch 629 / 100000 Iteration 0, loss = 0.0254 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0434 Iteration 60, loss = 0.0195 Iteration 80, loss = 0.0172 --- Epoch 630 / 100000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0448 Iteration 60, loss = 
0.0313 Iteration 80, loss = 0.0222 --- Epoch 631 / 100000 Iteration 0, loss = 0.0200 Iteration 20, loss = 0.0227 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0298 Iteration 80, loss = 0.0129 --- Epoch 632 / 100000 Iteration 0, loss = 0.0201 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0268 Iteration 80, loss = 0.0098 --- Epoch 633 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0194 Iteration 60, loss = 0.0274 Iteration 80, loss = 0.0185 --- Epoch 634 / 100000 Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0425 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0107 --- Epoch 635 / 100000 Iteration 0, loss = 0.0167 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0154 Iteration 80, loss = 0.0093 --- Epoch 636 / 100000 Iteration 0, loss = 0.0190 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0099 --- Epoch 637 / 100000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0161 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0217 --- Epoch 638 / 100000 Iteration 0, loss = 0.0157 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0114 --- Epoch 639 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0229 Iteration 80, loss = 0.0731 --- Epoch 640 / 100000 Iteration 0, loss = 0.0197 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0167 --- Epoch 641 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0154 Iteration 80, loss = 0.0167 --- Epoch 642 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0104 --- Epoch 643 / 
100000 Iteration 0, loss = 0.0297 Iteration 20, loss = 0.0198 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0170 --- Epoch 644 / 100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0256 Iteration 40, loss = 0.0328 Iteration 60, loss = 0.0227 Iteration 80, loss = 0.0145 --- Epoch 645 / 100000 Iteration 0, loss = 0.0258 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0381 Iteration 80, loss = 0.0244 --- Epoch 646 / 100000 Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0190 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0249 --- Epoch 647 / 100000 Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0180 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0101 --- Epoch 648 / 100000 Iteration 0, loss = 0.0206 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0114 --- Epoch 649 / 100000 Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0161 Iteration 60, loss = 0.0258 Iteration 80, loss = 0.0181 --- Epoch 650 / 100000 Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0163 Iteration 40, loss = 0.0300 Iteration 60, loss = 0.0478 Iteration 80, loss = 0.0100 --- Epoch 651 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0194 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0082 --- Epoch 652 / 100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0252 Iteration 80, loss = 0.0164 --- Epoch 653 / 100000 Iteration 0, loss = 0.0157 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0331 --- Epoch 654 / 100000 Iteration 0, loss = 0.0224 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0158 Iteration 80, loss = 0.0141 --- Epoch 655 / 100000 Iteration 0, loss = 0.0202 Iteration 20, loss = 
0.0093 Iteration 40, loss = 0.0220 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0539 --- Epoch 656 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0116 --- Epoch 657 / 100000 Iteration 0, loss = 0.0368 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0202 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0159 --- Epoch 658 / 100000 Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0149 --- Epoch 659 / 100000 Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0357 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0238 Iteration 80, loss = 0.0167 --- Epoch 660 / 100000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0269 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0145 --- Epoch 661 / 100000 Iteration 0, loss = 0.0200 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0247 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0115 --- Epoch 662 / 100000 Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0209 Iteration 80, loss = 0.0208 --- Epoch 663 / 100000 Iteration 0, loss = 0.0183 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0141 --- Epoch 664 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0300 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0147 --- Epoch 665 / 100000 Iteration 0, loss = 0.0272 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0307 Iteration 80, loss = 0.0146 --- Epoch 666 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0116 --- Epoch 667 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0309 Iteration 60, loss = 
0.0124 Iteration 80, loss = 0.0225 --- Epoch 668 / 100000 Iteration 0, loss = 0.0209 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0108 Iteration 80, loss = 0.0464 --- Epoch 669 / 100000 Iteration 0, loss = 0.0293 Iteration 20, loss = 0.0340 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0205 Iteration 80, loss = 0.0121 --- Epoch 670 / 100000 Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0256 Iteration 80, loss = 0.0099 --- Epoch 671 / 100000 Iteration 0, loss = 0.0244 Iteration 20, loss = 0.0224 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0731 Iteration 80, loss = 0.0110 --- Epoch 672 / 100000 Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0200 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0126 --- Epoch 673 / 100000 Iteration 0, loss = 0.0195 Iteration 20, loss = 0.0219 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0236 Iteration 80, loss = 0.0091 --- Epoch 674 / 100000 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0162 --- Epoch 675 / 100000 Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0208 Iteration 80, loss = 0.0165 --- Epoch 676 / 100000 Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0492 Iteration 60, loss = 0.0242 Iteration 80, loss = 0.0179 --- Epoch 677 / 100000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0151 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0238 --- Epoch 678 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0143 --- Epoch 679 / 100000 Iteration 0, loss = 0.0209 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0293 --- Epoch 680 / 
100000 Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0142 --- Epoch 681 / 100000 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0306 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0224 Iteration 80, loss = 0.0141 --- Epoch 682 / 100000 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0220 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0104 --- Epoch 683 / 100000 Iteration 0, loss = 0.0349 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0099 --- Epoch 684 / 100000 Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0213 Iteration 80, loss = 0.0119 --- Epoch 685 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0165 --- Epoch 686 / 100000 Iteration 0, loss = 0.0253 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0316 Iteration 80, loss = 0.0216 --- Epoch 687 / 100000 Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0168 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0357 Iteration 80, loss = 0.0171 --- Epoch 688 / 100000 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0133 --- Epoch 689 / 100000 Iteration 0, loss = 0.0255 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0134 --- Epoch 690 / 100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0191 Iteration 60, loss = 0.0267 Iteration 80, loss = 0.0158 --- Epoch 691 / 100000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0307 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0176 --- Epoch 692 / 100000 Iteration 0, loss = 0.0091 Iteration 20, loss = 
0.0208 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0070 --- Epoch 693 / 100000 Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0225 Iteration 80, loss = 0.0143 --- Epoch 694 / 100000 Iteration 0, loss = 0.0402 Iteration 20, loss = 0.0204 Iteration 40, loss = 0.0229 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0115 --- Epoch 695 / 100000 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0239 --- Epoch 696 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0378 Iteration 80, loss = 0.0139 --- Epoch 697 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0114 --- Epoch 698 / 100000 Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0189 Iteration 80, loss = 0.0195 --- Epoch 699 / 100000 Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0257 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0190 --- Epoch 700 / 100000 Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0165 --- Epoch 701 / 100000 Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0227 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0124 --- Epoch 702 / 100000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0147 --- Epoch 703 / 100000 Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0351 Iteration 80, loss = 0.0118 --- Epoch 704 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0152 Iteration 60, loss = 
0.0125 Iteration 80, loss = 0.0136 --- Epoch 705 / 100000 Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0084 --- Epoch 706 / 100000 Iteration 0, loss = 0.0247 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0230 Iteration 80, loss = 0.0178 --- Epoch 707 / 100000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0107 --- Epoch 708 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0222 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0243 Iteration 80, loss = 0.0182 --- Epoch 709 / 100000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0417 Iteration 80, loss = 0.0219 --- Epoch 710 / 100000 Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0325 --- Epoch 711 / 100000 Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0290 Iteration 80, loss = 0.0244 --- Epoch 712 / 100000 Iteration 0, loss = 0.0331 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0449 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0223 --- Epoch 713 / 100000 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0136 --- Epoch 714 / 100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0241 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0106 --- Epoch 715 / 100000 Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0209 --- Epoch 716 / 100000 Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0129 --- Epoch 717 / 
100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0153 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0076 --- Epoch 718 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0198 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0139 --- Epoch 719 / 100000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0156 --- Epoch 720 / 100000 Iteration 0, loss = 0.0177 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0292 Iteration 80, loss = 0.0148 --- Epoch 721 / 100000 Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0200 --- Epoch 722 / 100000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0126 --- Epoch 723 / 100000 Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0160 --- Epoch 724 / 100000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0068 --- Epoch 725 / 100000 Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0259 --- Epoch 726 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0247 --- Epoch 727 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0208 Iteration 80, loss = 0.0225 --- Epoch 728 / 100000 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0169 --- Epoch 729 / 100000 Iteration 0, loss = 0.0193 Iteration 20, loss = 
0.0210 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0247 --- Epoch 730 / 100000 Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0097 --- Epoch 731 / 100000 Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0242 Iteration 80, loss = 0.0227 --- Epoch 732 / 100000 Iteration 0, loss = 0.0200 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0134 --- Epoch 733 / 100000 Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0196 Iteration 60, loss = 0.0209 Iteration 80, loss = 0.0230 --- Epoch 734 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0265 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0281 --- Epoch 735 / 100000 Iteration 0, loss = 0.0497 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0200 Iteration 80, loss = 0.0142 --- Epoch 736 / 100000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0258 Iteration 60, loss = 0.0268 Iteration 80, loss = 0.0118 --- Epoch 737 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0254 Iteration 80, loss = 0.0162 --- Epoch 738 / 100000 Iteration 0, loss = 0.0227 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0176 --- Epoch 739 / 100000 Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0186 Iteration 80, loss = 0.0129 --- Epoch 740 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0096 --- Epoch 741 / 100000 Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0104 Iteration 60, loss = 
0.0094 Iteration 80, loss = 0.0103 --- Epoch 742 / 100000 Iteration 0, loss = 0.0233 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0443 Iteration 60, loss = 0.0248 Iteration 80, loss = 0.0105 --- Epoch 743 / 100000 Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0239 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0196 --- Epoch 744 / 100000 Iteration 0, loss = 0.0182 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0209 --- Epoch 745 / 100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0198 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0232 Iteration 80, loss = 0.0089 --- Epoch 746 / 100000 Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0126 --- Epoch 747 / 100000 Iteration 0, loss = 0.0209 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0262 --- Epoch 748 / 100000 Iteration 0, loss = 0.0220 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0114 --- Epoch 749 / 100000 Iteration 0, loss = 0.0213 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0097 --- Epoch 750 / 100000 Iteration 0, loss = 0.0185 Iteration 20, loss = 0.0161 Iteration 40, loss = 0.0431 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0090 --- Epoch 751 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0419 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0578 Iteration 80, loss = 0.0144 --- Epoch 752 / 100000 Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0193 Iteration 40, loss = 0.0193 Iteration 60, loss = 0.0191 Iteration 80, loss = 0.0219 --- Epoch 753 / 100000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0239 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0424 --- Epoch 754 / 
100000 Iteration 0, loss = 0.0208 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0176 --- Epoch 755 / 100000 Iteration 0, loss = 0.0266 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0183 Iteration 80, loss = 0.0245 --- Epoch 756 / 100000 Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0167 Iteration 40, loss = 0.0254 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0140 --- Epoch 757 / 100000 Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0307 Iteration 40, loss = 0.0199 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0108 --- Epoch 758 / 100000 Iteration 0, loss = 0.0233 Iteration 20, loss = 0.0157 Iteration 40, loss = 0.0151 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0084 --- Epoch 759 / 100000 Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0231 Iteration 60, loss = 0.0239 Iteration 80, loss = 0.0324 --- Epoch 760 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0336 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0138 --- Epoch 761 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0269 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0090 --- Epoch 762 / 100000 Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0267 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0198 --- Epoch 763 / 100000 Iteration 0, loss = 0.0288 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0242 Iteration 60, loss = 0.0382 Iteration 80, loss = 0.0124 --- Epoch 764 / 100000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0422 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0175 --- Epoch 765 / 100000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0153 Iteration 60, loss = 0.0231 Iteration 80, loss = 0.0148 --- Epoch 766 / 100000 Iteration 0, loss = 0.0069 Iteration 20, loss = 
0.0100 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0177 --- Epoch 767 / 100000 Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0307 --- Epoch 768 / 100000 Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0218 Iteration 60, loss = 0.0167 Iteration 80, loss = 0.0130 --- Epoch 769 / 100000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0125 --- Epoch 770 / 100000 Iteration 0, loss = 0.0217 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0132 --- Epoch 771 / 100000 Iteration 0, loss = 0.0244 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0284 --- Epoch 772 / 100000 Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0118 --- Epoch 773 / 100000 Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0213 --- Epoch 774 / 100000 Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0099 --- Epoch 775 / 100000 Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0146 --- Epoch 776 / 100000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0219 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0286 --- Epoch 777 / 100000 Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0409 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0110 --- Epoch 778 / 100000 Iteration 0, loss = 0.0362 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0329 Iteration 60, loss = 
0.0222 Iteration 80, loss = 0.0103 --- Epoch 779 / 100000 Iteration 0, loss = 0.0278 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0113 --- Epoch 780 / 100000 Iteration 0, loss = 0.0297 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0148 --- Epoch 781 / 100000 Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0199 Iteration 60, loss = 0.0207 Iteration 80, loss = 0.0191 --- Epoch 782 / 100000 Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0254 Iteration 40, loss = 0.0286 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0084 --- Epoch 783 / 100000 Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0187 --- Epoch 784 / 100000 Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0182 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0085 --- Epoch 785 / 100000 Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0199 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0169 --- Epoch 786 / 100000 Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0485 Iteration 40, loss = 0.0245 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0299 --- Epoch 787 / 100000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0247 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0159 --- Epoch 788 / 100000 Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0104 --- Epoch 789 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0322 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0203 Iteration 80, loss = 0.0163 --- Epoch 790 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0129 --- Epoch 791 / 
100000 Iteration 0, loss = 0.0189 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0245 Iteration 60, loss = 0.0144 Iteration 80, loss = 0.0094 --- Epoch 792 / 100000 Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0100 --- Epoch 793 / 100000 Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0117 --- Epoch 794 / 100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0193 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0103 --- Epoch 795 / 100000 Iteration 0, loss = 0.0154 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0196 --- Epoch 796 / 100000 Iteration 0, loss = 0.0245 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0098 --- Epoch 797 / 100000 Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0233 Iteration 60, loss = 0.0186 Iteration 80, loss = 0.0198 --- Epoch 798 / 100000 Iteration 0, loss = 0.0329 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0118 --- Epoch 799 / 100000 Iteration 0, loss = 0.0231 Iteration 20, loss = 0.0163 Iteration 40, loss = 0.0169 Iteration 60, loss = 0.0221 Iteration 80, loss = 0.0144 --- Epoch 800 / 100000 Iteration 0, loss = 0.0220 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0197 Iteration 80, loss = 0.0120 --- Epoch 801 / 100000 Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0170 --- Epoch 802 / 100000 Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0227 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0103 --- Epoch 803 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 
0.0158 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0246 --- Epoch 804 / 100000 Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0115 --- Epoch 805 / 100000 Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0096 --- Epoch 806 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0145 --- Epoch 807 / 100000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0156 --- Epoch 808 / 100000 Iteration 0, loss = 0.0369 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0182 --- Epoch 809 / 100000 Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0163 --- Epoch 810 / 100000 Iteration 0, loss = 0.0186 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0248 Iteration 60, loss = 0.0163 Iteration 80, loss = 0.0600 --- Epoch 811 / 100000 Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0157 --- Epoch 812 / 100000 Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0162 --- Epoch 813 / 100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0203 Iteration 80, loss = 0.0122 --- Epoch 814 / 100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0194 Iteration 80, loss = 0.0182 --- Epoch 815 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0123 Iteration 60, loss = 
0.0110 Iteration 80, loss = 0.0172 --- Epoch 816 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0107 --- Epoch 817 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0200 Iteration 40, loss = 0.0265 Iteration 60, loss = 0.0224 Iteration 80, loss = 0.0229 --- Epoch 818 / 100000 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0190 Iteration 60, loss = 0.0216 Iteration 80, loss = 0.0098 --- Epoch 819 / 100000 Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0259 Iteration 40, loss = 0.0169 Iteration 60, loss = 0.0331 Iteration 80, loss = 0.0183 --- Epoch 820 / 100000 Iteration 0, loss = 0.0208 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0303 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0172 --- Epoch 821 / 100000 Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0158 --- Epoch 822 / 100000 Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0198 Iteration 40, loss = 0.0257 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0098 --- Epoch 823 / 100000 Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0227 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0070 --- Epoch 824 / 100000 Iteration 0, loss = 0.0305 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0262 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0129 --- Epoch 825 / 100000 Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0153 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0302 --- Epoch 826 / 100000 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0175 Iteration 80, loss = 0.0206 --- Epoch 827 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0302 Iteration 80, loss = 0.0263 --- Epoch 828 / 
100000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0247 --- Epoch 829 / 100000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0328 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0163 --- Epoch 830 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0254 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0104 --- Epoch 831 / 100000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0217 Iteration 80, loss = 0.0153 --- Epoch 832 / 100000 Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0169 Iteration 60, loss = 0.0283 Iteration 80, loss = 0.0122 --- Epoch 833 / 100000 Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0234 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0083 --- Epoch 834 / 100000 Iteration 0, loss = 0.0238 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0281 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0197 --- Epoch 835 / 100000 Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0262 --- Epoch 836 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0196 Iteration 40, loss = 0.0201 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0128 --- Epoch 837 / 100000 Iteration 0, loss = 0.0244 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0240 Iteration 80, loss = 0.0197 --- Epoch 838 / 100000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0294 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0131 --- Epoch 839 / 100000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0144 --- Epoch 840 / 100000 Iteration 0, loss = 0.0082 Iteration 20, loss = 
0.0113 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0122 --- Epoch 841 / 100000 Iteration 0, loss = 0.0219 Iteration 20, loss = 0.0208 Iteration 40, loss = 0.0266 Iteration 60, loss = 0.0290 Iteration 80, loss = 0.0088 --- Epoch 842 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0107 --- Epoch 843 / 100000 Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0190 --- Epoch 844 / 100000 Iteration 0, loss = 0.0189 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0320 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0234 --- Epoch 845 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0240 Iteration 80, loss = 0.0118 --- Epoch 846 / 100000 Iteration 0, loss = 0.0177 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0396 Iteration 60, loss = 0.0408 Iteration 80, loss = 0.0158 --- Epoch 847 / 100000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0062 --- Epoch 848 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0213 Iteration 80, loss = 0.0114 --- Epoch 849 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0539 Iteration 80, loss = 0.0182 --- Epoch 850 / 100000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0268 Iteration 80, loss = 0.0120 --- Epoch 851 / 100000 Iteration 0, loss = 0.0177 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0114 --- Epoch 852 / 100000 Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0229 Iteration 60, loss = 
0.0091 Iteration 80, loss = 0.0134 --- Epoch 853 / 100000 Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0473 Iteration 80, loss = 0.0124 --- Epoch 854 / 100000 Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0144 Iteration 80, loss = 0.0181 --- Epoch 855 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0298 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0135 --- Epoch 856 / 100000 Iteration 0, loss = 0.0175 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0262 --- Epoch 857 / 100000 Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0081 --- Epoch 858 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0125 Iteration 80, loss = 0.0122 --- Epoch 859 / 100000 Iteration 0, loss = 0.0300 Iteration 20, loss = 0.0356 Iteration 40, loss = 0.0367 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0346 --- Epoch 860 / 100000 Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0177 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0245 --- Epoch 861 / 100000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0496 Iteration 40, loss = 0.0136 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0353 --- Epoch 862 / 100000 Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0289 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0074 --- Epoch 863 / 100000 Iteration 0, loss = 0.0216 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0267 --- Epoch 864 / 100000 Iteration 0, loss = 0.0246 Iteration 20, loss = 0.0429 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0109 --- Epoch 865 / 
100000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0167 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0146 --- Epoch 866 / 100000 Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0199 Iteration 80, loss = 0.0114 --- Epoch 867 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0153 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0123 --- Epoch 868 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0193 --- Epoch 869 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0628 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0102 --- Epoch 870 / 100000 Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0326 Iteration 80, loss = 0.0107 --- Epoch 871 / 100000 Iteration 0, loss = 0.0315 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0282 --- Epoch 872 / 100000 Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0191 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0152 --- Epoch 873 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0148 --- Epoch 874 / 100000 Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0338 --- Epoch 875 / 100000 Iteration 0, loss = 0.0349 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0183 Iteration 80, loss = 0.0205 --- Epoch 876 / 100000 Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0193 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0184 Iteration 80, loss = 0.0273 --- Epoch 877 / 100000 Iteration 0, loss = 0.0172 Iteration 20, loss = 
0.0130 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0312 --- Epoch 878 / 100000 Iteration 0, loss = 0.0175 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0321 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0082 --- Epoch 879 / 100000 Iteration 0, loss = 0.0184 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0117 --- Epoch 880 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0099 --- Epoch 881 / 100000 Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0186 --- Epoch 882 / 100000 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0361 Iteration 60, loss = 0.0253 Iteration 80, loss = 0.0149 --- Epoch 883 / 100000 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0079 --- Epoch 884 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0286 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0120 --- Epoch 885 / 100000 Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0235 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0216 Iteration 80, loss = 0.0108 --- Epoch 886 / 100000 Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0338 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0077 --- Epoch 887 / 100000 Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0085 --- Epoch 888 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0369 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0160 --- Epoch 889 / 100000 Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0081 Iteration 60, loss = 
0.0323 Iteration 80, loss = 0.0274 --- Epoch 890 / 100000 Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0252 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0229 --- Epoch 891 / 100000 Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0358 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0151 --- Epoch 892 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0144 --- Epoch 893 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0245 Iteration 60, loss = 0.0413 Iteration 80, loss = 0.0129 --- Epoch 894 / 100000 Iteration 0, loss = 0.0183 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0173 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0073 --- Epoch 895 / 100000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0217 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0194 --- Epoch 896 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0117 --- Epoch 897 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0194 Iteration 60, loss = 0.0293 Iteration 80, loss = 0.0153 --- Epoch 898 / 100000 Iteration 0, loss = 0.0208 Iteration 20, loss = 0.0233 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0130 --- Epoch 899 / 100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0175 --- Epoch 900 / 100000 Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0124 --- Epoch 901 / 100000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0263 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0161 --- Epoch 902 / 
100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0264 Iteration 40, loss = 0.0257 Iteration 60, loss = 0.0195 Iteration 80, loss = 0.0205 --- Epoch 903 / 100000 Iteration 0, loss = 0.0335 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0081 --- Epoch 904 / 100000 Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0419 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0135 --- Epoch 905 / 100000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0238 --- Epoch 906 / 100000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0158 --- Epoch 907 / 100000 Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0234 Iteration 80, loss = 0.0166 --- Epoch 908 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0224 Iteration 80, loss = 0.0108 --- Epoch 909 / 100000 Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0229 Iteration 80, loss = 0.0090 --- Epoch 910 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0402 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0247 Iteration 80, loss = 0.0421 --- Epoch 911 / 100000 Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0334 Iteration 80, loss = 0.0163 --- Epoch 912 / 100000 Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0186 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0145 --- Epoch 913 / 100000 Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0194 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0121 --- Epoch 914 / 100000 Iteration 0, loss = 0.0195 Iteration 20, loss = 
0.0265 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0260 Iteration 80, loss = 0.0140 --- Epoch 915 / 100000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0100 --- Epoch 916 / 100000 Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0218 --- Epoch 917 / 100000 Iteration 0, loss = 0.0197 Iteration 20, loss = 0.0269 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0099 --- Epoch 918 / 100000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0212 --- Epoch 919 / 100000 Iteration 0, loss = 0.0362 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0136 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0161 --- Epoch 920 / 100000 Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0147 --- Epoch 921 / 100000 Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0170 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0145 --- Epoch 922 / 100000 Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0115 --- Epoch 923 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0250 --- Epoch 924 / 100000 Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0280 Iteration 80, loss = 0.0213 --- Epoch 925 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0158 --- Epoch 926 / 100000 Iteration 0, loss = 0.0262 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0263 Iteration 60, loss = 
0.0127 Iteration 80, loss = 0.0144 --- Epoch 927 / 100000 Iteration 0, loss = 0.0223 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0198 --- Epoch 928 / 100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0099 --- Epoch 929 / 100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0084 --- Epoch 930 / 100000 Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0208 Iteration 80, loss = 0.0233 --- Epoch 931 / 100000 Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0125 Iteration 80, loss = 0.0157 --- Epoch 932 / 100000 Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0300 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0153 --- Epoch 933 / 100000 Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0110 --- Epoch 934 / 100000 Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0197 --- Epoch 935 / 100000 Iteration 0, loss = 0.0292 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0232 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0126 --- Epoch 936 / 100000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0283 --- Epoch 937 / 100000 Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0278 Iteration 40, loss = 0.0303 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0660 --- Epoch 938 / 100000 Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0283 Iteration 40, loss = 0.0190 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0137 --- Epoch 939 / 
100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0226 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0085 --- Epoch 940 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0076 --- Epoch 941 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0078 --- Epoch 942 / 100000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0198 --- Epoch 943 / 100000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0077 --- Epoch 944 / 100000 Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0422 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0143 --- Epoch 945 / 100000 Iteration 0, loss = 0.0415 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0177 --- Epoch 946 / 100000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0230 --- Epoch 947 / 100000 Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0247 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0403 --- Epoch 948 / 100000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0249 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0174 --- Epoch 949 / 100000 Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0250 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0089 --- Epoch 950 / 100000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0238 --- Epoch 951 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 
0.0101 Iteration 40, loss = 0.0286 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0183 --- Epoch 952 / 100000 Iteration 0, loss = 0.0213 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0247 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0083 --- Epoch 953 / 100000 Iteration 0, loss = 0.0242 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0196 Iteration 80, loss = 0.0103 --- Epoch 954 / 100000 Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0077 --- Epoch 955 / 100000 Iteration 0, loss = 0.0294 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0141 --- Epoch 956 / 100000 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0163 Iteration 80, loss = 0.0132 --- Epoch 957 / 100000 Iteration 0, loss = 0.0208 Iteration 20, loss = 0.0384 Iteration 40, loss = 0.0242 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0097 --- Epoch 958 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0075 --- Epoch 959 / 100000 Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0115 --- Epoch 960 / 100000 Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0211 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0279 --- Epoch 961 / 100000 Iteration 0, loss = 0.0350 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0109 --- Epoch 962 / 100000 Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0150 --- Epoch 963 / 100000 Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0130 Iteration 60, loss = 
0.0094 Iteration 80, loss = 0.0126 --- Epoch 964 / 100000 Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0091 --- Epoch 965 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0267 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0209 --- Epoch 966 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0216 --- Epoch 967 / 100000 Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0173 --- Epoch 968 / 100000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0228 --- Epoch 969 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0672 --- Epoch 970 / 100000 Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0237 Iteration 80, loss = 0.0243 --- Epoch 971 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0191 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0167 --- Epoch 972 / 100000 Iteration 0, loss = 0.0185 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0276 Iteration 60, loss = 0.0388 Iteration 80, loss = 0.0113 --- Epoch 973 / 100000 Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0218 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0136 --- Epoch 974 / 100000 Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0148 --- Epoch 975 / 100000 Iteration 0, loss = 0.0219 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0195 --- Epoch 976 / 
100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0107 --- Epoch 977 / 100000 Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0099 --- Epoch 978 / 100000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0119 --- Epoch 979 / 100000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0256 --- Epoch 980 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0164 --- Epoch 981 / 100000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0175 --- Epoch 982 / 100000 Iteration 0, loss = 0.0184 Iteration 20, loss = 0.0226 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0114 --- Epoch 983 / 100000 Iteration 0, loss = 0.0182 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0112 --- Epoch 984 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0242 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0204 Iteration 80, loss = 0.0129 --- Epoch 985 / 100000 Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0231 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0095 --- Epoch 986 / 100000 Iteration 0, loss = 0.0265 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0257 --- Epoch 987 / 100000 Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0184 Iteration 80, loss = 0.0204 --- Epoch 988 / 100000 Iteration 0, loss = 0.0160 Iteration 20, loss = 
0.0065 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0279 Iteration 80, loss = 0.0277 --- Epoch 989 / 100000 Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0077 --- Epoch 990 / 100000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0243 Iteration 60, loss = 0.0243 Iteration 80, loss = 0.0210 --- Epoch 991 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0097 --- Epoch 992 / 100000 Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0208 Iteration 80, loss = 0.0174 --- Epoch 993 / 100000 Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0191 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0286 Iteration 80, loss = 0.0142 --- Epoch 994 / 100000 Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0198 --- Epoch 995 / 100000 Iteration 0, loss = 0.0230 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0106 --- Epoch 996 / 100000 Iteration 0, loss = 0.0186 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0227 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0102 --- Epoch 997 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0217 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0166 --- Epoch 998 / 100000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0206 --- Epoch 999 / 100000 Iteration 0, loss = 0.0311 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0186 Iteration 80, loss = 0.0155 --- Epoch 1000 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0290 Iteration 60, loss 
= 0.0103 Iteration 80, loss = 0.0192 --- Epoch 1001 / 100000 Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0215 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0172 --- Epoch 1002 / 100000 Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0356 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0185 --- Epoch 1003 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0342 Iteration 60, loss = 0.0367 Iteration 80, loss = 0.0111 --- Epoch 1004 / 100000 Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0253 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0256 Iteration 80, loss = 0.0208 --- Epoch 1005 / 100000 Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0220 --- Epoch 1006 / 100000 Iteration 0, loss = 0.0224 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0177 --- Epoch 1007 / 100000 Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0148 --- Epoch 1008 / 100000 Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0058 --- Epoch 1009 / 100000 Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0138 --- Epoch 1010 / 100000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0137 Iteration 80, loss = 0.0056 --- Epoch 1011 / 100000 Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0159 Iteration 80, loss = 0.0167 --- Epoch 1012 / 100000 Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0103 --- 
Epoch 1013 / 100000 Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0230 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0103 --- Epoch 1014 / 100000 Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0399 Iteration 80, loss = 0.0091 --- Epoch 1015 / 100000 Iteration 0, loss = 0.0262 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0091 --- Epoch 1016 / 100000 Iteration 0, loss = 0.0257 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0173 --- Epoch 1017 / 100000 Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0108 Iteration 80, loss = 0.0136 --- Epoch 1018 / 100000 Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0171 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0118 --- Epoch 1019 / 100000 Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0173 Iteration 40, loss = 0.0298 Iteration 60, loss = 0.0209 Iteration 80, loss = 0.0133 --- Epoch 1020 / 100000 Iteration 0, loss = 0.0194 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0114 --- Epoch 1021 / 100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0177 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0302 --- Epoch 1022 / 100000 Iteration 0, loss = 0.0238 Iteration 20, loss = 0.0243 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0144 Iteration 80, loss = 0.0154 --- Epoch 1023 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0186 Iteration 80, loss = 0.0112 --- Epoch 1024 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0270 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0144 --- Epoch 1025 / 100000 Iteration 0, loss = 
0.0091 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0222 --- Epoch 1026 / 100000 Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0229 Iteration 40, loss = 0.0193 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0092 --- Epoch 1027 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0121 --- Epoch 1028 / 100000 Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0234 --- Epoch 1029 / 100000 Iteration 0, loss = 0.0183 Iteration 20, loss = 0.0203 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0185 --- Epoch 1030 / 100000 Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0190 Iteration 80, loss = 0.0142 --- Epoch 1031 / 100000 Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0092 --- Epoch 1032 / 100000 Iteration 0, loss = 0.0616 Iteration 20, loss = 0.0219 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0156 --- Epoch 1033 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0248 Iteration 80, loss = 0.0202 --- Epoch 1034 / 100000 Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0151 --- Epoch 1035 / 100000 Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0163 --- Epoch 1036 / 100000 Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0370 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0110 --- Epoch 1037 / 100000 Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0138 
Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0193 --- Epoch 1038 / 100000 Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0339 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0065 --- Epoch 1039 / 100000 Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0150 --- Epoch 1040 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0486 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0131 --- Epoch 1041 / 100000 Iteration 0, loss = 0.0223 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0176 Iteration 80, loss = 0.0164 --- Epoch 1042 / 100000 Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0363 Iteration 60, loss = 0.0240 Iteration 80, loss = 0.0136 --- Epoch 1043 / 100000 Iteration 0, loss = 0.0223 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0095 --- Epoch 1044 / 100000 Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0293 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0157 --- Epoch 1045 / 100000 Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0192 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0251 --- Epoch 1046 / 100000 Iteration 0, loss = 0.0356 Iteration 20, loss = 0.0233 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0074 --- Epoch 1047 / 100000 Iteration 0, loss = 0.0251 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0217 Iteration 80, loss = 0.0072 --- Epoch 1048 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0172 --- Epoch 1049 / 100000 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0111 Iteration 60, 
loss = 0.0089 Iteration 80, loss = 0.0128 --- Epoch 1050 / 100000 Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0258 Iteration 60, loss = 0.0447 Iteration 80, loss = 0.0154 --- Epoch 1051 / 100000 Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0176 --- Epoch 1052 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0452 --- Epoch 1053 / 100000 Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0350 Iteration 80, loss = 0.0130 --- Epoch 1054 / 100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0227 --- Epoch 1055 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0108 Iteration 80, loss = 0.0111 --- Epoch 1056 / 100000 Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0254 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0139 --- Epoch 1057 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0159 Iteration 80, loss = 0.0146 --- Epoch 1058 / 100000 Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0249 Iteration 80, loss = 0.0176 --- Epoch 1059 / 100000 Iteration 0, loss = 0.0183 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0111 --- Epoch 1060 / 100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0152 --- Epoch 1061 / 100000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0358 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0160 
--- Epoch 1062 / 100000 Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0175 --- Epoch 1063 / 100000 Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0325 Iteration 80, loss = 0.0151 --- Epoch 1064 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0092 --- Epoch 1065 / 100000 Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0364 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0320 Iteration 80, loss = 0.0161 --- Epoch 1066 / 100000 Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0118 --- Epoch 1067 / 100000 Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0282 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0304 --- Epoch 1068 / 100000 Iteration 0, loss = 0.0222 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0125 --- Epoch 1069 / 100000 Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0111 --- Epoch 1070 / 100000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0109 --- Epoch 1071 / 100000 Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0243 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0114 --- Epoch 1072 / 100000 Iteration 0, loss = 0.0212 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0289 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0092 --- Epoch 1073 / 100000 Iteration 0, loss = 0.0333 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0087 --- Epoch 1074 / 100000 Iteration 0, loss = 
0.0191 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0273 Iteration 80, loss = 0.0116 --- Epoch 1075 / 100000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0135 --- Epoch 1076 / 100000 Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0117 --- Epoch 1077 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0171 --- Epoch 1078 / 100000 Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0240 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0177 --- Epoch 1079 / 100000 Iteration 0, loss = 0.0229 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0176 Iteration 80, loss = 0.0114 --- Epoch 1080 / 100000 Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0186 --- Epoch 1081 / 100000 Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0237 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0126 --- Epoch 1082 / 100000 Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0148 --- Epoch 1083 / 100000 Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0082 --- Epoch 1084 / 100000 Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0078 --- Epoch 1085 / 100000 Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0175 --- Epoch 1086 / 100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0103 
Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0126 --- Epoch 1087 / 100000 Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0201 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0108 --- Epoch 1088 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0131 --- Epoch 1089 / 100000 Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0069 --- Epoch 1090 / 100000 Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0094 --- Epoch 1091 / 100000 Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0114 --- Epoch 1092 / 100000 Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0219 Iteration 80, loss = 0.0133 --- Epoch 1093 / 100000 Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0179 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0168 --- Epoch 1094 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0167 Iteration 40, loss = 0.0246 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0263 --- Epoch 1095 / 100000 Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0116 --- Epoch 1096 / 100000 Iteration 0, loss = 0.0136 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0196 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0109 --- Epoch 1097 / 100000 Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0358 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0254 Iteration 80, loss = 0.0072 --- Epoch 1098 / 100000 Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0108 Iteration 60, 
loss = 0.0107 Iteration 80, loss = 0.0222 --- Epoch 1099 / 100000 Iteration 0, loss = 0.0183 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0136 --- Epoch 1100 / 100000 Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0218 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0147 --- Epoch 1101 / 100000 Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0095 --- Epoch 1102 / 100000 Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0094 --- Epoch 1103 / 100000 Iteration 0, loss = 0.0174 Iteration 20, loss = 0.0161 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0116 --- Epoch 1104 / 100000 Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0122 --- Epoch 1105 / 100000 Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0138 --- Epoch 1106 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0096 --- Epoch 1107 / 100000 Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0108 --- Epoch 1108 / 100000 Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0260 Iteration 60, loss = 0.0229 Iteration 80, loss = 0.0131 --- Epoch 1109 / 100000 Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0136 --- Epoch 1110 / 100000 Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0283 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0115 
--- Epoch 1111 / 100000 Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0128 --- Epoch 1112 / 100000 Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0096 --- Epoch 1113 / 100000 Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0228 Iteration 60, loss = 0.0214 Iteration 80, loss = 0.0114 --- Epoch 1114 / 100000 Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0201 --- Epoch 1115 / 100000 Iteration 0, loss = 0.0251 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0231 Iteration 60, loss = 0.0194 Iteration 80, loss = 0.0142 --- Epoch 1116 / 100000 Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0369 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0231 --- Epoch 1117 / 100000 Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0087 --- Epoch 1118 / 100000 Iteration 0, loss = 0.0450 Iteration 20, loss = 0.0223 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0152 --- Epoch 1119 / 100000 Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0093 --- Epoch 1120 / 100000 Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0099 --- Epoch 1121 / 100000 Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0100 --- Epoch 1122 / 100000 Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0148 --- Epoch 1123 / 100000 Iteration 0, loss = 
0.0148 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0082 --- Epoch 1124 / 100000 Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0603 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0412 --- Epoch 1125 / 100000 Iteration 0, loss = 0.0225 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0223 Iteration 80, loss = 0.0112 --- Epoch 1126 / 100000 Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0098 --- Epoch 1127 / 100000 Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0161 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0243 --- Epoch 1128 / 100000 Iteration 0, loss = 0.0263 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0156 --- Epoch 1129 / 100000 Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0173 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0224
--------------------------------------------------------------------------- KeyboardInterrupt Traceback (most recent call last) <ipython-input-561-b24253d770e1> in <module> ----> 1 train(model8, optimizer, epochs=100000, x_train=data["X_train_class"], y_train=data["y_train_class"], criterion=nn.MSELoss()) <ipython-input-502-f8fe1643891d> in train(model, optimizer, epochs, x_train, y_train, criterion) 27 y = y_batch[t].to(device=device, dtype=dtype) 28 ---> 29 scores = model(x) 30 31 loss = criterion(scores.view(-1), y.view(-1)) /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs) 720 result = self._slow_forward(*input, **kwargs) 721 else: --> 722 result = self.forward(*input, **kwargs) 723 for hook in itertools.chain( 724 _global_forward_hooks.values(), <ipython-input-559-1454e4041bce> in forward(self, x) 35 scores = F.relu(self.batchnorm6(self.conv6(scores))) 36 scores = self.upsample(scores) ---> 37 scores = torch.tanh(self.conv7(scores)) 38 39 # with_x = torch.cat((scores.view(-1), x.view(-1)), 0) /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs) 720 result = self._slow_forward(*input, **kwargs) 721 else: --> 722 result = self.forward(*input, **kwargs) 723 for hook in itertools.chain( 724 _global_forward_hooks.values(), /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/conv.py in forward(self, input) 417 418 def forward(self, input: Tensor) -> Tensor: --> 419 return self._conv_forward(input, self.weight) 420 421 class Conv3d(_ConvNd): /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/conv.py in _conv_forward(self, input, weight) 414 _pair(0), self.dilation, self.groups) 415 return F.conv2d(input, weight, self.bias, self.stride, --> 416 self.padding, self.dilation, self.groups) 417 418 def forward(self, input: Tensor) -> Tensor: KeyboardInterrupt:
# Run testModel on model8 with the data stored under the "X_test_class" /
# "y_test_class" keys, passing an L1 (mean absolute error) criterion.
# NOTE(review): the train(...) call for model8 shown in the traceback above used
# nn.MSELoss(), while this call passes nn.L1Loss() - presumably intentional, confirm.
testModel(model8, x_test=data["X_test_class"], y_test=data["y_test_class"], criterion=nn.L1Loss())
Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers). Clipping input data to the valid range for imshow with RGB data ([0..1] for floats or [0..255] for integers).
class ConvNet4(nn.Module):
    """Encoder-decoder CNN that predicts a 3-channel image from one channel.

    ``forward`` takes a single, unbatched image, keeps only its first
    channel, downsamples it with three stride-2 convolutions (encoder),
    restores the resolution with three bilinear upsampling stages (decoder),
    adds the input channel back onto the prediction and finally min-max
    rescales the flattened result to ``[0, 1]``.

    Because the encoder halves the resolution three times and the decoder
    doubles it three times, the height and width of the input need to be
    multiples of 8 (e.g. 32x32) for the residual addition to line up.
    """

    # Lower bound for the min-max range. Without it a constant output would
    # divide 0 by 0 and turn every value into NaN.
    _NORM_EPS = 1e-8

    def __init__(self):
        """Create the batch-norm, upsampling and convolution layers."""
        super().__init__()

        # Epoch counter, initialised to 0 here and never modified by this
        # class (presumably maintained by the external training loop).
        self.epochsTrained = 0

        # One batch-norm per hidden convolution (conv1..conv6).
        self.batchnorm1 = nn.BatchNorm2d(32)
        self.batchnorm2 = nn.BatchNorm2d(64)
        self.batchnorm3 = nn.BatchNorm2d(128)
        self.batchnorm4 = nn.BatchNorm2d(128)
        self.batchnorm5 = nn.BatchNorm2d(64)
        self.batchnorm6 = nn.BatchNorm2d(32)

        # align_corners=False is what PyTorch already uses when the argument
        # is omitted; spelling it out keeps the numerics identical while
        # avoiding the "default upsampling behavior" warning on every call.
        self.upsample = nn.Upsample(
            scale_factor=2, mode='bilinear', align_corners=False
        )

        # Encoder: 1 -> 32 -> 64 -> 128 -> 128 channels, three stride-2 steps.
        self.conv1 = nn.Conv2d(1, 32, kernel_size=3, padding=1)
        self.conv2 = nn.Conv2d(32, 64, kernel_size=3, stride=2, padding=1)
        self.conv3 = nn.Conv2d(64, 128, kernel_size=3, stride=2, padding=1)
        self.conv4 = nn.Conv2d(128, 128, kernel_size=3, stride=2, padding=1)

        # Decoder: 128 -> 64 -> 32 -> 3 channels, resolution-preserving convs.
        self.conv5 = nn.Conv2d(128, 64, kernel_size=3, padding=1)
        self.conv6 = nn.Conv2d(64, 32, kernel_size=3, padding=1)
        self.conv7 = nn.Conv2d(32, 3, kernel_size=3, padding=1)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Predict a 3-channel image for one input image.

        Args:
            x: A single image indexed as ``x[0, :, :]``, i.e. a 3-D tensor
                laid out as (channels, H, W). Only channel 0 is used.

        Returns:
            A 1-D tensor with ``3 * H * W`` elements, min-max rescaled so
            that its smallest value is 0 and its largest is 1. If the
            pre-normalisation output is constant, all zeros are returned
            instead of NaN.
        """
        # Keep channel 0 only and add batch and channel axes: (1, 1, H, W).
        x = x[0, :, :].unsqueeze(0).unsqueeze(0)

        # Encoder
        scores = F.relu(self.batchnorm1(self.conv1(x)))
        scores = F.relu(self.batchnorm2(self.conv2(scores)))
        scores = F.relu(self.batchnorm3(self.conv3(scores)))
        scores = F.relu(self.batchnorm4(self.conv4(scores)))

        # Decoder
        scores = self.upsample(scores)
        scores = F.relu(self.batchnorm5(self.conv5(scores)))
        scores = self.upsample(scores)
        scores = F.relu(self.batchnorm6(self.conv6(scores)))
        scores = self.upsample(scores)

        # Add x back onto the prediction (broadcast over the 3 output
        # channels) so the network only has to learn how to colour x rather
        # than how to reproduce the structure of x.
        scores = torch.tanh(self.conv7(scores)) + x

        # Flatten and rescale to the range 0-1.
        scores = scores.view(-1)
        lowest = torch.min(scores)
        # Clamp the range away from zero so a constant output yields zeros
        # rather than NaN; any non-degenerate range is left untouched.
        value_range = torch.clamp(
            torch.max(scores) - lowest, min=self._NORM_EPS
        )
        return (scores - lowest) / value_range
# Step size for plain SGD.
learning_rate = 1e-2

# Fresh ConvNet4 instance, optimised with SGD over all of its parameters.
model9 = ConvNet4()
optimizer = optim.SGD(model9.parameters(), lr=learning_rate)

# Train on the "ship" training split with a mean-squared-error objective.
train(
    model9,
    optimizer,
    epochs=2000,
    x_train=data["X_train_ship"],
    y_train=data["y_train_ship"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 2000 - 1 epochs total Iteration 0, loss = 0.0564 Iteration 20, loss = 0.0359 Iteration 40, loss = 0.0359 Iteration 60, loss = 0.0223 Iteration 80, loss = 0.0284 --- Epoch 2 / 2000 - 2 epochs total Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0427 Iteration 60, loss = 0.0245 Iteration 80, loss = 0.0186 --- Epoch 3 / 2000 - 3 epochs total Iteration 0, loss = 0.0228 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0230 Iteration 80, loss = 0.0183 --- Epoch 4 / 2000 - 4 epochs total Iteration 0, loss = 0.0417 Iteration 20, loss = 0.0443 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0675 --- Epoch 5 / 2000 - 5 epochs total Iteration 0, loss = 0.0193 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0118 --- Epoch 6 / 2000 - 6 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0076 --- Epoch 7 / 2000 - 7 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0143 --- Epoch 8 / 2000 - 8 epochs total Iteration 0, loss = 0.0219 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0318 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0137 --- Epoch 9 / 2000 - 9 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0164 --- Epoch 10 / 2000 - 10 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0291 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0121 --- Epoch 11 / 2000 - 11 epochs total Iteration 0, loss = 0.0314 Iteration 20, loss = 0.0170 Iteration 40, loss = 0.0447 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0070 --- Epoch 12 / 2000 - 12 epochs total Iteration 0, loss = 0.0087 
Iteration 20, loss = 0.0288 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0117 --- Epoch 13 / 2000 - 13 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0363 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0129 --- Epoch 14 / 2000 - 14 epochs total Iteration 0, loss = 0.0284 Iteration 20, loss = 0.0206 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0171 --- Epoch 15 / 2000 - 15 epochs total Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0078 --- Epoch 16 / 2000 - 16 epochs total Iteration 0, loss = 0.0404 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0126 --- Epoch 17 / 2000 - 17 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0241 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0048 --- Epoch 18 / 2000 - 18 epochs total Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0474 Iteration 80, loss = 0.0116 --- Epoch 19 / 2000 - 19 epochs total Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0031 --- Epoch 20 / 2000 - 20 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0344 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0090 --- Epoch 21 / 2000 - 21 epochs total Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0162 --- Epoch 22 / 2000 - 22 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0385 Iteration 60, loss = 0.0295 Iteration 80, loss = 0.0122 --- Epoch 23 / 2000 - 23 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0069 Iteration 40, loss = 
0.0057 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0088 --- Epoch 24 / 2000 - 24 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0067 --- Epoch 25 / 2000 - 25 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0274 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0073 --- Epoch 26 / 2000 - 26 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0228 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0054 --- Epoch 27 / 2000 - 27 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0269 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0092 --- Epoch 28 / 2000 - 28 epochs total Iteration 0, loss = 0.0265 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0057 --- Epoch 29 / 2000 - 29 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0031 --- Epoch 30 / 2000 - 30 epochs total Iteration 0, loss = 0.0582 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0110 --- Epoch 31 / 2000 - 31 epochs total Iteration 0, loss = 0.0164 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0085 --- Epoch 32 / 2000 - 32 epochs total Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0302 Iteration 80, loss = 0.0062 --- Epoch 33 / 2000 - 33 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0237 Iteration 80, loss = 0.0166 --- Epoch 34 / 2000 - 34 epochs total Iteration 0, loss = 0.0193 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0106 Iteration 80, 
loss = 0.0445 --- Epoch 35 / 2000 - 35 epochs total Iteration 0, loss = 0.0220 Iteration 20, loss = 0.0163 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0321 --- Epoch 36 / 2000 - 36 epochs total Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0184 Iteration 80, loss = 0.0370 --- Epoch 37 / 2000 - 37 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0047 --- Epoch 38 / 2000 - 38 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0053 --- Epoch 39 / 2000 - 39 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0248 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0072 --- Epoch 40 / 2000 - 40 epochs total Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0062 --- Epoch 41 / 2000 - 41 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0171 --- Epoch 42 / 2000 - 42 epochs total Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0161 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0244 Iteration 80, loss = 0.0444 --- Epoch 43 / 2000 - 43 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0102 --- Epoch 44 / 2000 - 44 epochs total Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0303 --- Epoch 45 / 2000 - 45 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0096 --- Epoch 46 / 2000 - 46 epochs total 
Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0088 --- Epoch 47 / 2000 - 47 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0057 --- Epoch 48 / 2000 - 48 epochs total Iteration 0, loss = 0.0211 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0190 --- Epoch 49 / 2000 - 49 epochs total Iteration 0, loss = 0.0319 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0083 --- Epoch 50 / 2000 - 50 epochs total Iteration 0, loss = 0.0193 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0136 --- Epoch 51 / 2000 - 51 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0073 --- Epoch 52 / 2000 - 52 epochs total Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0284 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0096 --- Epoch 53 / 2000 - 53 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0256 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0058 --- Epoch 54 / 2000 - 54 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0128 --- Epoch 55 / 2000 - 55 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0190 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0077 --- Epoch 56 / 2000 - 56 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0115 --- Epoch 57 / 2000 - 57 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 
0.0269 Iteration 40, loss = 0.0227 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0153 --- Epoch 58 / 2000 - 58 epochs total Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0265 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0043 --- Epoch 59 / 2000 - 59 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0258 Iteration 60, loss = 0.0238 Iteration 80, loss = 0.0057 --- Epoch 60 / 2000 - 60 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0071 --- Epoch 61 / 2000 - 61 epochs total Iteration 0, loss = 0.0338 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0029 --- Epoch 62 / 2000 - 62 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0201 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0049 --- Epoch 63 / 2000 - 63 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0057 --- Epoch 64 / 2000 - 64 epochs total Iteration 0, loss = 0.0446 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0071 --- Epoch 65 / 2000 - 65 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0065 --- Epoch 66 / 2000 - 66 epochs total Iteration 0, loss = 0.0235 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0209 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0046 --- Epoch 67 / 2000 - 67 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0250 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0058 --- Epoch 68 / 2000 - 68 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0026 Iteration 60, 
loss = 0.0095 Iteration 80, loss = 0.0139 --- Epoch 69 / 2000 - 69 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0352 --- Epoch 70 / 2000 - 70 epochs total Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0052 --- Epoch 71 / 2000 - 71 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0101 --- Epoch 72 / 2000 - 72 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0076 --- Epoch 73 / 2000 - 73 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0201 Iteration 80, loss = 0.0107 --- Epoch 74 / 2000 - 74 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0086 --- Epoch 75 / 2000 - 75 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0053 --- Epoch 76 / 2000 - 76 epochs total Iteration 0, loss = 0.0319 Iteration 20, loss = 0.0192 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0030 --- Epoch 77 / 2000 - 77 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0063 --- Epoch 78 / 2000 - 78 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0041 --- Epoch 79 / 2000 - 79 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0178 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0030 --- Epoch 
80 / 2000 - 80 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0073 --- Epoch 81 / 2000 - 81 epochs total Iteration 0, loss = 0.0282 Iteration 20, loss = 0.0254 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0238 --- Epoch 82 / 2000 - 82 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0094 --- Epoch 83 / 2000 - 83 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0501 Iteration 60, loss = 0.0137 Iteration 80, loss = 0.0133 --- Epoch 84 / 2000 - 84 epochs total Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0206 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0200 --- Epoch 85 / 2000 - 85 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0037 --- Epoch 86 / 2000 - 86 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0184 --- Epoch 87 / 2000 - 87 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0150 --- Epoch 88 / 2000 - 88 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0156 --- Epoch 89 / 2000 - 89 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0054 --- Epoch 90 / 2000 - 90 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0218 --- Epoch 91 / 2000 - 91 epochs total Iteration 0, loss = 
0.0078 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0266 --- Epoch 92 / 2000 - 92 epochs total Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0377 --- Epoch 93 / 2000 - 93 epochs total Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0036 --- Epoch 94 / 2000 - 94 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0365 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0058 --- Epoch 95 / 2000 - 95 epochs total Iteration 0, loss = 0.0229 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0080 --- Epoch 96 / 2000 - 96 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0078 --- Epoch 97 / 2000 - 97 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0093 --- Epoch 98 / 2000 - 98 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0215 --- Epoch 99 / 2000 - 99 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0218 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0083 --- Epoch 100 / 2000 - 100 epochs total Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0322 --- Epoch 101 / 2000 - 101 epochs total Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0409 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0057 --- Epoch 102 / 2000 - 102 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0142 Iteration 
40, loss = 0.0036 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0033 --- Epoch 103 / 2000 - 103 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0067 --- Epoch 104 / 2000 - 104 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0191 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0058 --- Epoch 105 / 2000 - 105 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0038 --- Epoch 106 / 2000 - 106 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0363 --- Epoch 107 / 2000 - 107 epochs total Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0112 --- Epoch 108 / 2000 - 108 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0319 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0053 --- Epoch 109 / 2000 - 109 epochs total Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.1290 Iteration 80, loss = 0.0030 --- Epoch 110 / 2000 - 110 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0058 --- Epoch 111 / 2000 - 111 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0305 Iteration 80, loss = 0.0321 --- Epoch 112 / 2000 - 112 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0044 --- Epoch 113 / 2000 - 113 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0063 Iteration 
60, loss = 0.0088 Iteration 80, loss = 0.0095 --- Epoch 114 / 2000 - 114 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0121 --- Epoch 115 / 2000 - 115 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0191 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0027 --- Epoch 116 / 2000 - 116 epochs total Iteration 0, loss = 0.0372 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0109 --- Epoch 117 / 2000 - 117 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0041 --- Epoch 118 / 2000 - 118 epochs total Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0029 --- Epoch 119 / 2000 - 119 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0243 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0041 --- Epoch 120 / 2000 - 120 epochs total Iteration 0, loss = 0.0162 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0131 --- Epoch 121 / 2000 - 121 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0437 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0088 --- Epoch 122 / 2000 - 122 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0282 --- Epoch 123 / 2000 - 123 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0129 --- Epoch 124 / 2000 - 124 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0292 Iteration 
80, loss = 0.0126 --- Epoch 125 / 2000 - 125 epochs total Iteration 0, loss = 0.0266 Iteration 20, loss = 0.0246 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0014 --- Epoch 126 / 2000 - 126 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0087 --- Epoch 127 / 2000 - 127 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0328 --- Epoch 128 / 2000 - 128 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0015 --- Epoch 129 / 2000 - 129 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0144 --- Epoch 130 / 2000 - 130 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0022 --- Epoch 131 / 2000 - 131 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0035 --- Epoch 132 / 2000 - 132 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0054 --- Epoch 133 / 2000 - 133 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0111 --- Epoch 134 / 2000 - 134 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0050 --- Epoch 135 / 2000 - 135 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0244 Iteration 80, loss = 0.0012 --- Epoch 
136 / 2000 - 136 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0038 --- Epoch 137 / 2000 - 137 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0030 --- Epoch 138 / 2000 - 138 epochs total Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0046 --- Epoch 139 / 2000 - 139 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0020 --- Epoch 140 / 2000 - 140 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0020 --- Epoch 141 / 2000 - 141 epochs total Iteration 0, loss = 0.0151 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0057 --- Epoch 142 / 2000 - 142 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0096 --- Epoch 143 / 2000 - 143 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0031 --- Epoch 144 / 2000 - 144 epochs total Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0025 --- Epoch 145 / 2000 - 145 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0215 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0049 --- Epoch 146 / 2000 - 146 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0167 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0014 --- Epoch 147 / 2000 - 147 epochs total 
Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0142 --- Epoch 148 / 2000 - 148 epochs total Iteration 0, loss = 0.0282 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0082 --- Epoch 149 / 2000 - 149 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0033 --- Epoch 150 / 2000 - 150 epochs total Iteration 0, loss = 0.0227 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0014 --- Epoch 151 / 2000 - 151 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0652 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0056 --- Epoch 152 / 2000 - 152 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0182 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0088 --- Epoch 153 / 2000 - 153 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0254 Iteration 80, loss = 0.0312 --- Epoch 154 / 2000 - 154 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0051 --- Epoch 155 / 2000 - 155 epochs total Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0093 --- Epoch 156 / 2000 - 156 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0117 --- Epoch 157 / 2000 - 157 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0034 --- Epoch 158 / 2000 - 158 epochs total Iteration 0, loss = 0.0099 
Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0060 --- Epoch 159 / 2000 - 159 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0325 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0030 --- Epoch 160 / 2000 - 160 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0047 --- Epoch 161 / 2000 - 161 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0189 --- Epoch 162 / 2000 - 162 epochs total Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0119 --- Epoch 163 / 2000 - 163 epochs total Iteration 0, loss = 0.0136 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0034 --- Epoch 164 / 2000 - 164 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0091 --- Epoch 165 / 2000 - 165 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0394 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0294 --- Epoch 166 / 2000 - 166 epochs total Iteration 0, loss = 0.0340 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0036 --- Epoch 167 / 2000 - 167 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0203 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0217 --- Epoch 168 / 2000 - 168 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0046 --- Epoch 169 / 2000 - 169 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0045 
Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0231 --- Epoch 170 / 2000 - 170 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0018 --- Epoch 171 / 2000 - 171 epochs total Iteration 0, loss = 0.0164 Iteration 20, loss = 0.0182 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0143 --- Epoch 172 / 2000 - 172 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0237 Iteration 80, loss = 0.0095 --- Epoch 173 / 2000 - 173 epochs total Iteration 0, loss = 0.0399 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0055 --- Epoch 174 / 2000 - 174 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0045 --- Epoch 175 / 2000 - 175 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0247 --- Epoch 176 / 2000 - 176 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0041 --- Epoch 177 / 2000 - 177 epochs total Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0025 --- Epoch 178 / 2000 - 178 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0042 --- Epoch 179 / 2000 - 179 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0316 --- Epoch 180 / 2000 - 180 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0019 
Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0037 --- Epoch 181 / 2000 - 181 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0023 --- Epoch 182 / 2000 - 182 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0092 --- Epoch 183 / 2000 - 183 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0112 --- Epoch 184 / 2000 - 184 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0062 --- Epoch 185 / 2000 - 185 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0046 --- Epoch 186 / 2000 - 186 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0325 Iteration 80, loss = 0.0009 --- Epoch 187 / 2000 - 187 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0046 --- Epoch 188 / 2000 - 188 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0320 Iteration 80, loss = 0.0042 --- Epoch 189 / 2000 - 189 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0023 --- Epoch 190 / 2000 - 190 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0158 Iteration 80, loss = 0.0042 --- Epoch 191 / 2000 - 191 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0182 Iteration 60, loss = 0.0100 
Iteration 80, loss = 0.0053 --- Epoch 192 / 2000 - 192 epochs total Iteration 0, loss = 0.0200 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0119 --- Epoch 193 / 2000 - 193 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0019 --- Epoch 194 / 2000 - 194 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0026 --- Epoch 195 / 2000 - 195 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0042 --- Epoch 196 / 2000 - 196 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0418 --- Epoch 197 / 2000 - 197 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0036 --- Epoch 198 / 2000 - 198 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0128 --- Epoch 199 / 2000 - 199 epochs total Iteration 0, loss = 0.0221 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0050 --- Epoch 200 / 2000 - 200 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0020 --- Epoch 201 / 2000 - 201 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0138 --- Epoch 202 / 2000 - 202 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0266 Iteration 80, loss = 0.0028 
--- Epoch 203 / 2000 - 203 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0226 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0169 --- Epoch 204 / 2000 - 204 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0018 --- Epoch 205 / 2000 - 205 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0031 --- Epoch 206 / 2000 - 206 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0059 --- Epoch 207 / 2000 - 207 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0390 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0049 --- Epoch 208 / 2000 - 208 epochs total Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0021 --- Epoch 209 / 2000 - 209 epochs total Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0046 --- Epoch 210 / 2000 - 210 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0121 --- Epoch 211 / 2000 - 211 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0021 --- Epoch 212 / 2000 - 212 epochs total Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0070 --- Epoch 213 / 2000 - 213 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0102 --- Epoch 214 / 2000 - 214 
epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0345 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0027 --- Epoch 215 / 2000 - 215 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0176 Iteration 80, loss = 0.0087 --- Epoch 216 / 2000 - 216 epochs total Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0277 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0053 --- Epoch 217 / 2000 - 217 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0052 --- Epoch 218 / 2000 - 218 epochs total Iteration 0, loss = 0.0360 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0035 --- Epoch 219 / 2000 - 219 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0191 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0045 --- Epoch 220 / 2000 - 220 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0020 --- Epoch 221 / 2000 - 221 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0018 --- Epoch 222 / 2000 - 222 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0069 --- Epoch 223 / 2000 - 223 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0048 --- Epoch 224 / 2000 - 224 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0051 --- Epoch 225 / 2000 - 225 epochs total Iteration 0, loss 
= 0.0033 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0017 --- Epoch 226 / 2000 - 226 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0077 --- Epoch 227 / 2000 - 227 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0052 --- Epoch 228 / 2000 - 228 epochs total Iteration 0, loss = 0.0213 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0060 --- Epoch 229 / 2000 - 229 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0059 --- Epoch 230 / 2000 - 230 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0099 --- Epoch 231 / 2000 - 231 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0477 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0081 --- Epoch 232 / 2000 - 232 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0062 --- Epoch 233 / 2000 - 233 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0047 --- Epoch 234 / 2000 - 234 epochs total Iteration 0, loss = 0.0187 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0051 --- Epoch 235 / 2000 - 235 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0062 --- Epoch 236 / 2000 - 236 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 
0.0038 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0023 --- Epoch 237 / 2000 - 237 epochs total Iteration 0, loss = 0.0237 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0065 --- Epoch 238 / 2000 - 238 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0039 --- Epoch 239 / 2000 - 239 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0280 Iteration 80, loss = 0.0061 --- Epoch 240 / 2000 - 240 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0025 --- Epoch 241 / 2000 - 241 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0051 --- Epoch 242 / 2000 - 242 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0217 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0034 --- Epoch 243 / 2000 - 243 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0065 --- Epoch 244 / 2000 - 244 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0089 --- Epoch 245 / 2000 - 245 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0025 --- Epoch 246 / 2000 - 246 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0070 --- Epoch 247 / 2000 - 247 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0026 Iteration 40, loss = 
0.0116 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0118 --- Epoch 248 / 2000 - 248 epochs total Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0061 --- Epoch 249 / 2000 - 249 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0024 --- Epoch 250 / 2000 - 250 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0165 --- Epoch 251 / 2000 - 251 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0070 --- Epoch 252 / 2000 - 252 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0058 --- Epoch 253 / 2000 - 253 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0049 --- Epoch 254 / 2000 - 254 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0326 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0076 --- Epoch 255 / 2000 - 255 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0032 --- Epoch 256 / 2000 - 256 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0184 --- Epoch 257 / 2000 - 257 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0042 --- Epoch 258 / 2000 - 258 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0062 Iteration 60, loss = 
0.0022 Iteration 80, loss = 0.0071 --- Epoch 259 / 2000 - 259 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0190 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0062 --- Epoch 260 / 2000 - 260 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0097 --- Epoch 261 / 2000 - 261 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0073 --- Epoch 262 / 2000 - 262 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0041 --- Epoch 263 / 2000 - 263 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0221 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0036 --- Epoch 264 / 2000 - 264 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0026 --- Epoch 265 / 2000 - 265 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0099 --- Epoch 266 / 2000 - 266 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0091 --- Epoch 267 / 2000 - 267 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0129 --- Epoch 268 / 2000 - 268 epochs total Iteration 0, loss = 0.0185 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0103 --- Epoch 269 / 2000 - 269 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0134 Iteration 80, loss = 
0.0060 --- Epoch 270 / 2000 - 270 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0045 --- Epoch 271 / 2000 - 271 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0020 --- Epoch 272 / 2000 - 272 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0075 --- Epoch 273 / 2000 - 273 epochs total Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0035 --- Epoch 274 / 2000 - 274 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0089 --- Epoch 275 / 2000 - 275 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0026 --- Epoch 276 / 2000 - 276 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0109 --- Epoch 277 / 2000 - 277 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0065 --- Epoch 278 / 2000 - 278 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0341 --- Epoch 279 / 2000 - 279 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0139 --- Epoch 280 / 2000 - 280 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0023 --- Epoch 281 / 2000 - 
281 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0043 --- Epoch 282 / 2000 - 282 epochs total Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0040 --- Epoch 283 / 2000 - 283 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0122 --- Epoch 284 / 2000 - 284 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0403 --- Epoch 285 / 2000 - 285 epochs total Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0106 --- Epoch 286 / 2000 - 286 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0090 --- Epoch 287 / 2000 - 287 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0323 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0070 --- Epoch 288 / 2000 - 288 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0013 --- Epoch 289 / 2000 - 289 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0014 --- Epoch 290 / 2000 - 290 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0037 --- Epoch 291 / 2000 - 291 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0052 --- Epoch 292 / 2000 - 292 epochs total Iteration 0, 
loss = 0.0043 Iteration 20, loss = 0.0298 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0096 --- Epoch 293 / 2000 - 293 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0050 --- Epoch 294 / 2000 - 294 epochs total Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0015 --- Epoch 295 / 2000 - 295 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0256 Iteration 80, loss = 0.0050 --- Epoch 296 / 2000 - 296 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0373 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0045 --- Epoch 297 / 2000 - 297 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0089 --- Epoch 298 / 2000 - 298 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0075 --- Epoch 299 / 2000 - 299 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0226 Iteration 80, loss = 0.0057 --- Epoch 300 / 2000 - 300 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0053 --- Epoch 301 / 2000 - 301 epochs total Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0043 --- Epoch 302 / 2000 - 302 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0271 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0016 --- Epoch 303 / 2000 - 303 epochs total Iteration 0, loss = 0.0022 Iteration 20, 
loss = 0.0088 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0027 --- Epoch 304 / 2000 - 304 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0058 --- Epoch 305 / 2000 - 305 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0086 --- Epoch 306 / 2000 - 306 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0055 --- Epoch 307 / 2000 - 307 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0093 --- Epoch 308 / 2000 - 308 epochs total Iteration 0, loss = 0.0152 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0024 --- Epoch 309 / 2000 - 309 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0173 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0057 --- Epoch 310 / 2000 - 310 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0035 --- Epoch 311 / 2000 - 311 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0015 --- Epoch 312 / 2000 - 312 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0007 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0020 --- Epoch 313 / 2000 - 313 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0050 --- Epoch 314 / 2000 - 314 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0056 Iteration 40, 
loss = 0.0147 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0061 --- Epoch 315 / 2000 - 315 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0080 --- Epoch 316 / 2000 - 316 epochs total Iteration 0, loss = 0.0306 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0030 --- Epoch 317 / 2000 - 317 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0306 Iteration 80, loss = 0.0042 --- Epoch 318 / 2000 - 318 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0281 Iteration 80, loss = 0.0022 --- Epoch 319 / 2000 - 319 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0031 --- Epoch 320 / 2000 - 320 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0042 --- Epoch 321 / 2000 - 321 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0075 --- Epoch 322 / 2000 - 322 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0099 --- Epoch 323 / 2000 - 323 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0168 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0017 --- Epoch 324 / 2000 - 324 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0079 --- Epoch 325 / 2000 - 325 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0014 Iteration 60, 
loss = 0.0015 Iteration 80, loss = 0.0013 --- Epoch 326 / 2000 - 326 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0072 --- Epoch 327 / 2000 - 327 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0143 --- Epoch 328 / 2000 - 328 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0350 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0051 --- Epoch 329 / 2000 - 329 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0078 --- Epoch 330 / 2000 - 330 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0306 Iteration 80, loss = 0.0029 --- Epoch 331 / 2000 - 331 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0106 --- Epoch 332 / 2000 - 332 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0020 --- Epoch 333 / 2000 - 333 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0182 --- Epoch 334 / 2000 - 334 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0074 --- Epoch 335 / 2000 - 335 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0110 --- Epoch 336 / 2000 - 336 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0020 Iteration 80, 
loss = 0.0039 --- Epoch 337 / 2000 - 337 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0210 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0137 --- Epoch 338 / 2000 - 338 epochs total Iteration 0, loss = 0.0182 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0019 --- Epoch 339 / 2000 - 339 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0034 --- Epoch 340 / 2000 - 340 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0186 --- Epoch 341 / 2000 - 341 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0023 --- Epoch 342 / 2000 - 342 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0294 --- Epoch 343 / 2000 - 343 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0021 --- Epoch 344 / 2000 - 344 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0228 --- Epoch 345 / 2000 - 345 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0081 --- Epoch 346 / 2000 - 346 epochs total Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0127 --- Epoch 347 / 2000 - 347 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0063 --- Epoch 348 / 
2000 - 348 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0042 --- Epoch 349 / 2000 - 349 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0176 --- Epoch 350 / 2000 - 350 epochs total Iteration 0, loss = 0.0226 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0041 --- Epoch 351 / 2000 - 351 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0039 --- Epoch 352 / 2000 - 352 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0028 --- Epoch 353 / 2000 - 353 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0051 --- Epoch 354 / 2000 - 354 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0023 --- Epoch 355 / 2000 - 355 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0130 --- Epoch 356 / 2000 - 356 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0089 --- Epoch 357 / 2000 - 357 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0059 --- Epoch 358 / 2000 - 358 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0017 --- Epoch 359 / 2000 - 359 epochs total 
Iteration 0, loss = 0.0380 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0089 --- Epoch 360 / 2000 - 360 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0026 --- Epoch 361 / 2000 - 361 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0192 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0054 --- Epoch 362 / 2000 - 362 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0010 --- Epoch 363 / 2000 - 363 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0048 --- Epoch 364 / 2000 - 364 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0016 --- Epoch 365 / 2000 - 365 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0251 Iteration 80, loss = 0.0017 --- Epoch 366 / 2000 - 366 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0095 --- Epoch 367 / 2000 - 367 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0019 --- Epoch 368 / 2000 - 368 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0037 --- Epoch 369 / 2000 - 369 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0243 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0033 --- Epoch 370 / 2000 - 370 epochs total Iteration 0, loss = 0.0045 
Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0254 --- Epoch 371 / 2000 - 371 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0119 --- Epoch 372 / 2000 - 372 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0049 --- Epoch 373 / 2000 - 373 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0058 --- Epoch 374 / 2000 - 374 epochs total Iteration 0, loss = 0.0346 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0031 --- Epoch 375 / 2000 - 375 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0143 --- Epoch 376 / 2000 - 376 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0019 --- Epoch 377 / 2000 - 377 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0193 --- Epoch 378 / 2000 - 378 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0039 --- Epoch 379 / 2000 - 379 epochs total Iteration 0, loss = 0.0201 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0015 --- Epoch 380 / 2000 - 380 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0073 --- Epoch 381 / 2000 - 381 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0057 
Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0085 --- Epoch 382 / 2000 - 382 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0051 --- Epoch 383 / 2000 - 383 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0259 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0026 --- Epoch 384 / 2000 - 384 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0021 --- Epoch 385 / 2000 - 385 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0084 --- Epoch 386 / 2000 - 386 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0038 --- Epoch 387 / 2000 - 387 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0045 --- Epoch 388 / 2000 - 388 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0116 --- Epoch 389 / 2000 - 389 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0046 --- Epoch 390 / 2000 - 390 epochs total Iteration 0, loss = 0.0140 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0092 --- Epoch 391 / 2000 - 391 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0326 --- Epoch 392 / 2000 - 392 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0282 
Iteration 60, loss = 0.0199 Iteration 80, loss = 0.0041 --- Epoch 393 / 2000 - 393 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0178 --- Epoch 394 / 2000 - 394 epochs total Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0053 --- Epoch 395 / 2000 - 395 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0049 --- Epoch 396 / 2000 - 396 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0087 --- Epoch 397 / 2000 - 397 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0091 --- Epoch 398 / 2000 - 398 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0122 --- Epoch 399 / 2000 - 399 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0027 --- Epoch 400 / 2000 - 400 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0044 --- Epoch 401 / 2000 - 401 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0287 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0064 --- Epoch 402 / 2000 - 402 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0131 --- Epoch 403 / 2000 - 403 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0037 
Iteration 80, loss = 0.0025 --- Epoch 404 / 2000 - 404 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0038 --- Epoch 405 / 2000 - 405 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0039 --- Epoch 406 / 2000 - 406 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0014 --- Epoch 407 / 2000 - 407 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0074 --- Epoch 408 / 2000 - 408 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0352 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0013 --- Epoch 409 / 2000 - 409 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0034 --- Epoch 410 / 2000 - 410 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0048 --- Epoch 411 / 2000 - 411 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0055 --- Epoch 412 / 2000 - 412 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0320 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0021 --- Epoch 413 / 2000 - 413 epochs total Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0046 --- Epoch 414 / 2000 - 414 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0044 
--- Epoch 415 / 2000 - 415 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0036 --- Epoch 416 / 2000 - 416 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0045 --- Epoch 417 / 2000 - 417 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0026 --- Epoch 418 / 2000 - 418 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0337 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0070 --- Epoch 419 / 2000 - 419 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0078 --- Epoch 420 / 2000 - 420 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0036 --- Epoch 421 / 2000 - 421 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0039 --- Epoch 422 / 2000 - 422 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0137 --- Epoch 423 / 2000 - 423 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0010 --- Epoch 424 / 2000 - 424 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0025 --- Epoch 425 / 2000 - 425 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0188 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0040 --- Epoch 426 / 2000 - 426 
epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0100 --- Epoch 427 / 2000 - 427 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0232 --- Epoch 428 / 2000 - 428 epochs total Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0378 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0029 --- Epoch 429 / 2000 - 429 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0023 --- Epoch 430 / 2000 - 430 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0052 --- Epoch 431 / 2000 - 431 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0025 --- Epoch 432 / 2000 - 432 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0051 --- Epoch 433 / 2000 - 433 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0052 --- Epoch 434 / 2000 - 434 epochs total Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0029 --- Epoch 435 / 2000 - 435 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0059 --- Epoch 436 / 2000 - 436 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0059 --- Epoch 437 / 2000 - 437 epochs total Iteration 0, loss 
= 0.0132 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0089 --- Epoch 438 / 2000 - 438 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0007 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0089 --- Epoch 439 / 2000 - 439 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0024 --- Epoch 440 / 2000 - 440 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0048 --- Epoch 441 / 2000 - 441 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0121 --- Epoch 442 / 2000 - 442 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0062 --- Epoch 443 / 2000 - 443 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0200 --- Epoch 444 / 2000 - 444 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0057 --- Epoch 445 / 2000 - 445 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0018 --- Epoch 446 / 2000 - 446 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0038 --- Epoch 447 / 2000 - 447 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0018 --- Epoch 448 / 2000 - 448 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 
0.0267 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0015 --- Epoch 449 / 2000 - 449 epochs total Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0028 --- Epoch 450 / 2000 - 450 epochs total Iteration 0, loss = 0.0289 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0062 --- Epoch 451 / 2000 - 451 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0106 --- Epoch 452 / 2000 - 452 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0037 --- Epoch 453 / 2000 - 453 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0048 --- Epoch 454 / 2000 - 454 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0084 --- Epoch 455 / 2000 - 455 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0016 --- Epoch 456 / 2000 - 456 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0038 --- Epoch 457 / 2000 - 457 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0020 --- Epoch 458 / 2000 - 458 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0043 --- Epoch 459 / 2000 - 459 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0037 Iteration 40, loss = 
0.0033 Iteration 60, loss = 0.0248 Iteration 80, loss = 0.0038 --- Epoch 460 / 2000 - 460 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0098 --- Epoch 461 / 2000 - 461 epochs total Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0136 --- Epoch 462 / 2000 - 462 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0042 --- Epoch 463 / 2000 - 463 epochs total Iteration 0, loss = 0.0331 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0039 --- Epoch 464 / 2000 - 464 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0032 --- Epoch 465 / 2000 - 465 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0107 --- Epoch 466 / 2000 - 466 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0075 --- Epoch 467 / 2000 - 467 epochs total Iteration 0, loss = 0.0231 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0101 --- Epoch 468 / 2000 - 468 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0075 --- Epoch 469 / 2000 - 469 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0037 --- Epoch 470 / 2000 - 470 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0440 Iteration 60, loss = 
0.0045 Iteration 80, loss = 0.0019 --- Epoch 471 / 2000 - 471 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0019 --- Epoch 472 / 2000 - 472 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0121 --- Epoch 473 / 2000 - 473 epochs total Iteration 0, loss = 0.0266 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0022 --- Epoch 474 / 2000 - 474 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0043 --- Epoch 475 / 2000 - 475 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0037 --- Epoch 476 / 2000 - 476 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0021 --- Epoch 477 / 2000 - 477 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0040 --- Epoch 478 / 2000 - 478 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0084 --- Epoch 479 / 2000 - 479 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0085 --- Epoch 480 / 2000 - 480 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0154 --- Epoch 481 / 2000 - 481 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0086 Iteration 80, loss = 
0.0022 --- Epoch 482 / 2000 - 482 epochs total Iteration 0, loss = 0.0183 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0097 --- Epoch 483 / 2000 - 483 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0019 --- Epoch 484 / 2000 - 484 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0263 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0105 --- Epoch 485 / 2000 - 485 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0077 --- Epoch 486 / 2000 - 486 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0062 --- Epoch 487 / 2000 - 487 epochs total Iteration 0, loss = 0.0347 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0028 --- Epoch 488 / 2000 - 488 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0085 --- Epoch 489 / 2000 - 489 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0028 --- Epoch 490 / 2000 - 490 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0216 Iteration 60, loss = 0.0236 Iteration 80, loss = 0.0053 --- Epoch 491 / 2000 - 491 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0122 --- Epoch 492 / 2000 - 492 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0013 --- Epoch 493 / 2000 - 
493 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0034 --- Epoch 494 / 2000 - 494 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0011 --- Epoch 495 / 2000 - 495 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0188 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0012 --- Epoch 496 / 2000 - 496 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0062 --- Epoch 497 / 2000 - 497 epochs total Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0057 --- Epoch 498 / 2000 - 498 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0045 --- Epoch 499 / 2000 - 499 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0021 --- Epoch 500 / 2000 - 500 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0033 --- Epoch 501 / 2000 - 501 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0017 --- Epoch 502 / 2000 - 502 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0151 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0016 --- Epoch 503 / 2000 - 503 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0025 --- Epoch 504 / 2000 - 504 epochs total Iteration 0, 
loss = 0.0048 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0074 --- Epoch 505 / 2000 - 505 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0249 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0054 --- Epoch 506 / 2000 - 506 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0068 --- Epoch 507 / 2000 - 507 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0102 --- Epoch 508 / 2000 - 508 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0309 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0050 --- Epoch 509 / 2000 - 509 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0013 --- Epoch 510 / 2000 - 510 epochs total Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0047 --- Epoch 511 / 2000 - 511 epochs total Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0061 --- Epoch 512 / 2000 - 512 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0080 --- Epoch 513 / 2000 - 513 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0017 --- Epoch 514 / 2000 - 514 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0068 --- Epoch 515 / 2000 - 515 epochs total Iteration 0, loss = 0.0087 Iteration 20, 
loss = 0.0088 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0027 --- Epoch 516 / 2000 - 516 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0051 --- Epoch 517 / 2000 - 517 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0150 --- Epoch 518 / 2000 - 518 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0060 --- Epoch 519 / 2000 - 519 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0187 --- Epoch 520 / 2000 - 520 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0207 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0122 --- Epoch 521 / 2000 - 521 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0233 --- Epoch 522 / 2000 - 522 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0033 --- Epoch 523 / 2000 - 523 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0034 --- Epoch 524 / 2000 - 524 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0054 --- Epoch 525 / 2000 - 525 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0040 --- Epoch 526 / 2000 - 526 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0053 Iteration 40, 
loss = 0.0040 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0034 --- Epoch 527 / 2000 - 527 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0071 --- Epoch 528 / 2000 - 528 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0145 --- Epoch 529 / 2000 - 529 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0070 --- Epoch 530 / 2000 - 530 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0016 --- Epoch 531 / 2000 - 531 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0023 --- Epoch 532 / 2000 - 532 epochs total Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0050 --- Epoch 533 / 2000 - 533 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0069 --- Epoch 534 / 2000 - 534 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0057 --- Epoch 535 / 2000 - 535 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0300 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0167 --- Epoch 536 / 2000 - 536 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0025 --- Epoch 537 / 2000 - 537 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0040 Iteration 60, 
loss = 0.0033 Iteration 80, loss = 0.0192 --- Epoch 538 / 2000 - 538 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0026 --- Epoch 539 / 2000 - 539 epochs total Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0027 --- Epoch 540 / 2000 - 540 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0013 --- Epoch 541 / 2000 - 541 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0094 --- Epoch 542 / 2000 - 542 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0125 Iteration 80, loss = 0.0085 --- Epoch 543 / 2000 - 543 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0082 --- Epoch 544 / 2000 - 544 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0099 --- Epoch 545 / 2000 - 545 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0046 --- Epoch 546 / 2000 - 546 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0049 --- Epoch 547 / 2000 - 547 epochs total Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0034 --- Epoch 548 / 2000 - 548 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0056 Iteration 80, 
loss = 0.0091 --- Epoch 549 / 2000 - 549 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0013 --- Epoch 550 / 2000 - 550 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0020 --- Epoch 551 / 2000 - 551 epochs total Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0023 --- Epoch 552 / 2000 - 552 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0068 --- Epoch 553 / 2000 - 553 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0080 --- Epoch 554 / 2000 - 554 epochs total Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0050 --- Epoch 555 / 2000 - 555 epochs total Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0106 --- Epoch 556 / 2000 - 556 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0023 --- Epoch 557 / 2000 - 557 epochs total Iteration 0, loss = 0.0231 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0068 --- Epoch 558 / 2000 - 558 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0064 --- Epoch 559 / 2000 - 559 epochs total Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0020 --- Epoch 560 / 
2000 - 560 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0114 --- Epoch 561 / 2000 - 561 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0048 --- Epoch 562 / 2000 - 562 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0022 --- Epoch 563 / 2000 - 563 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0076 --- Epoch 564 / 2000 - 564 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0054 --- Epoch 565 / 2000 - 565 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0050 --- Epoch 566 / 2000 - 566 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0035 --- Epoch 567 / 2000 - 567 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0093 --- Epoch 568 / 2000 - 568 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0231 --- Epoch 569 / 2000 - 569 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0144 --- Epoch 570 / 2000 - 570 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0034 --- Epoch 571 / 2000 - 571 epochs total 
Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0031 --- Epoch 572 / 2000 - 572 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0074 --- Epoch 573 / 2000 - 573 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0119 --- Epoch 574 / 2000 - 574 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0035 --- Epoch 575 / 2000 - 575 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0137 --- Epoch 576 / 2000 - 576 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0063 --- Epoch 577 / 2000 - 577 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0015 --- Epoch 578 / 2000 - 578 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0037 --- Epoch 579 / 2000 - 579 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0045 --- Epoch 580 / 2000 - 580 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0016 --- Epoch 581 / 2000 - 581 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0016 --- Epoch 582 / 2000 - 582 epochs total Iteration 0, loss = 0.0020 
Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0071 --- Epoch 583 / 2000 - 583 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0105 --- Epoch 584 / 2000 - 584 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0030 --- Epoch 585 / 2000 - 585 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0022 --- Epoch 586 / 2000 - 586 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0022 --- Epoch 587 / 2000 - 587 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0041 --- Epoch 588 / 2000 - 588 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0043 --- Epoch 589 / 2000 - 589 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0053 --- Epoch 590 / 2000 - 590 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0035 --- Epoch 591 / 2000 - 591 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0019 --- Epoch 592 / 2000 - 592 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0054 --- Epoch 593 / 2000 - 593 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0054 
Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0090 --- Epoch 594 / 2000 - 594 epochs total Iteration 0, loss = 0.0493 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0032 --- Epoch 595 / 2000 - 595 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0083 --- Epoch 596 / 2000 - 596 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0023 --- Epoch 597 / 2000 - 597 epochs total Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0025 --- Epoch 598 / 2000 - 598 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0037 --- Epoch 599 / 2000 - 599 epochs total Iteration 0, loss = 0.0223 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0025 --- Epoch 600 / 2000 - 600 epochs total Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0039 --- Epoch 601 / 2000 - 601 epochs total Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0234 Iteration 80, loss = 0.0014 --- Epoch 602 / 2000 - 602 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0078 --- Epoch 603 / 2000 - 603 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0038 --- Epoch 604 / 2000 - 604 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0019 
Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0093 --- Epoch 605 / 2000 - 605 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0041 --- Epoch 606 / 2000 - 606 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0136 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0116 --- Epoch 607 / 2000 - 607 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0176 Iteration 80, loss = 0.0027 --- Epoch 608 / 2000 - 608 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0055 --- Epoch 609 / 2000 - 609 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0104 --- Epoch 610 / 2000 - 610 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0215 --- Epoch 611 / 2000 - 611 epochs total Iteration 0, loss = 0.0215 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0220 Iteration 80, loss = 0.0020 --- Epoch 612 / 2000 - 612 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0047 --- Epoch 613 / 2000 - 613 epochs total Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0118 --- Epoch 614 / 2000 - 614 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0013 --- Epoch 615 / 2000 - 615 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0218 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0041 
Iteration 80, loss = 0.0045 --- Epoch 616 / 2000 - 616 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0027 --- Epoch 617 / 2000 - 617 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0060 --- Epoch 618 / 2000 - 618 epochs total Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0037 --- Epoch 619 / 2000 - 619 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0037 --- Epoch 620 / 2000 - 620 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0130 --- Epoch 621 / 2000 - 621 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0037 --- Epoch 622 / 2000 - 622 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0023 --- Epoch 623 / 2000 - 623 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0069 --- Epoch 624 / 2000 - 624 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0071 --- Epoch 625 / 2000 - 625 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0275 --- Epoch 626 / 2000 - 626 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0017 
--- Epoch 627 / 2000 - 627 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0121 --- Epoch 628 / 2000 - 628 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0030 --- Epoch 629 / 2000 - 629 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0017 --- Epoch 630 / 2000 - 630 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0064 --- Epoch 631 / 2000 - 631 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0044 --- Epoch 632 / 2000 - 632 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0163 Iteration 80, loss = 0.0009 --- Epoch 633 / 2000 - 633 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0019 --- Epoch 634 / 2000 - 634 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0075 --- Epoch 635 / 2000 - 635 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0140 --- Epoch 636 / 2000 - 636 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0058 --- Epoch 637 / 2000 - 637 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0069 --- Epoch 638 / 2000 - 638 
epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0028 --- Epoch 639 / 2000 - 639 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0108 --- Epoch 640 / 2000 - 640 epochs total Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0017 --- Epoch 641 / 2000 - 641 epochs total Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0042 --- Epoch 642 / 2000 - 642 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0226 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0025 --- Epoch 643 / 2000 - 643 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0041 --- Epoch 644 / 2000 - 644 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0072 --- Epoch 645 / 2000 - 645 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0028 --- Epoch 646 / 2000 - 646 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0190 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0037 --- Epoch 647 / 2000 - 647 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0173 --- Epoch 648 / 2000 - 648 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0080 --- Epoch 649 / 2000 - 649 epochs total Iteration 0, loss 
= 0.0019 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0028 --- Epoch 650 / 2000 - 650 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0034 --- Epoch 651 / 2000 - 651 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0025 --- Epoch 652 / 2000 - 652 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0019 --- Epoch 653 / 2000 - 653 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0028 --- Epoch 654 / 2000 - 654 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0350 --- Epoch 655 / 2000 - 655 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0056 --- Epoch 656 / 2000 - 656 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0018 --- Epoch 657 / 2000 - 657 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0019 --- Epoch 658 / 2000 - 658 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0024 --- Epoch 659 / 2000 - 659 epochs total Iteration 0, loss = 0.0243 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0057 --- Epoch 660 / 2000 - 660 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 
0.0034 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0279 Iteration 80, loss = 0.0022 --- Epoch 661 / 2000 - 661 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0031 --- Epoch 662 / 2000 - 662 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0076 --- Epoch 663 / 2000 - 663 epochs total Iteration 0, loss = 0.0215 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0033 --- Epoch 664 / 2000 - 664 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0058 --- Epoch 665 / 2000 - 665 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0363 --- Epoch 666 / 2000 - 666 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0043 --- Epoch 667 / 2000 - 667 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0015 --- Epoch 668 / 2000 - 668 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0130 --- Epoch 669 / 2000 - 669 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0021 --- Epoch 670 / 2000 - 670 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0141 --- Epoch 671 / 2000 - 671 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0047 Iteration 40, loss = 
0.0014 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0038 --- Epoch 672 / 2000 - 672 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0224 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0015 --- Epoch 673 / 2000 - 673 epochs total Iteration 0, loss = 0.0245 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0147 --- Epoch 674 / 2000 - 674 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0102 --- Epoch 675 / 2000 - 675 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0449 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0025 --- Epoch 676 / 2000 - 676 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0040 --- Epoch 677 / 2000 - 677 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0013 --- Epoch 678 / 2000 - 678 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0017 --- Epoch 679 / 2000 - 679 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0231 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0129 --- Epoch 680 / 2000 - 680 epochs total Iteration 0, loss = 0.0220 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0149 --- Epoch 681 / 2000 - 681 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0016 --- Epoch 682 / 2000 - 682 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0047 Iteration 60, loss = 
0.0026 Iteration 80, loss = 0.0051 --- Epoch 683 / 2000 - 683 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0014 --- Epoch 684 / 2000 - 684 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0203 Iteration 80, loss = 0.0036 --- Epoch 685 / 2000 - 685 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0365 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0044 --- Epoch 686 / 2000 - 686 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0025 --- Epoch 687 / 2000 - 687 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0027 --- Epoch 688 / 2000 - 688 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0062 --- Epoch 689 / 2000 - 689 epochs total Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0023 --- Epoch 690 / 2000 - 690 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0051 --- Epoch 691 / 2000 - 691 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0022 --- Epoch 692 / 2000 - 692 epochs total Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0051 --- Epoch 693 / 2000 - 693 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0056 Iteration 80, loss = 
0.0052 --- Epoch 694 / 2000 - 694 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0035 --- Epoch 695 / 2000 - 695 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0087 --- Epoch 696 / 2000 - 696 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0025 --- Epoch 697 / 2000 - 697 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0069 --- Epoch 698 / 2000 - 698 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0044 --- Epoch 699 / 2000 - 699 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0014 --- Epoch 700 / 2000 - 700 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0039 --- Epoch 701 / 2000 - 701 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0210 --- Epoch 702 / 2000 - 702 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0021 --- Epoch 703 / 2000 - 703 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0025 --- Epoch 704 / 2000 - 704 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0193 --- Epoch 705 / 2000 - 
705 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0228 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0015 --- Epoch 706 / 2000 - 706 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0037 --- Epoch 707 / 2000 - 707 epochs total Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0032 --- Epoch 708 / 2000 - 708 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0064 --- Epoch 709 / 2000 - 709 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0037 --- Epoch 710 / 2000 - 710 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0061 --- Epoch 711 / 2000 - 711 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0051 --- Epoch 712 / 2000 - 712 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0024 --- Epoch 713 / 2000 - 713 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0044 --- Epoch 714 / 2000 - 714 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0025 --- Epoch 715 / 2000 - 715 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0045 --- Epoch 716 / 2000 - 716 epochs total Iteration 0, 
loss = 0.0042 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0020 --- Epoch 717 / 2000 - 717 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0057 --- Epoch 718 / 2000 - 718 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0188 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0052 --- Epoch 719 / 2000 - 719 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0027 --- Epoch 720 / 2000 - 720 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0047 --- Epoch 721 / 2000 - 721 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0018 --- Epoch 722 / 2000 - 722 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0081 --- Epoch 723 / 2000 - 723 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0051 --- Epoch 724 / 2000 - 724 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0143 --- Epoch 725 / 2000 - 725 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0027 --- Epoch 726 / 2000 - 726 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0026 --- Epoch 727 / 2000 - 727 epochs total Iteration 0, loss = 0.0052 Iteration 20, 
loss = 0.0105 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0219 Iteration 80, loss = 0.0044 --- Epoch 728 / 2000 - 728 epochs total Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0206 --- Epoch 729 / 2000 - 729 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0067 --- Epoch 730 / 2000 - 730 epochs total Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0064 --- Epoch 731 / 2000 - 731 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0098 --- Epoch 732 / 2000 - 732 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0045 --- Epoch 733 / 2000 - 733 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0037 --- Epoch 734 / 2000 - 734 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0052 --- Epoch 735 / 2000 - 735 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0055 --- Epoch 736 / 2000 - 736 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0022 --- Epoch 737 / 2000 - 737 epochs total Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0096 --- Epoch 738 / 2000 - 738 epochs total Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0044 Iteration 40, 
loss = 0.0085 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0018 --- Epoch 739 / 2000 - 739 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0213 Iteration 80, loss = 0.0022 --- Epoch 740 / 2000 - 740 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0067 --- Epoch 741 / 2000 - 741 epochs total Iteration 0, loss = 0.0208 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0081 --- Epoch 742 / 2000 - 742 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0066 --- Epoch 743 / 2000 - 743 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0370 --- Epoch 744 / 2000 - 744 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0036 --- Epoch 745 / 2000 - 745 epochs total Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0142 --- Epoch 746 / 2000 - 746 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0299 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0050 --- Epoch 747 / 2000 - 747 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0124 --- Epoch 748 / 2000 - 748 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0031 --- Epoch 749 / 2000 - 749 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0020 Iteration 60, 
loss = 0.0019 Iteration 80, loss = 0.0142 --- Epoch 750 / 2000 - 750 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0067 --- Epoch 751 / 2000 - 751 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0057 --- Epoch 752 / 2000 - 752 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0031 --- Epoch 753 / 2000 - 753 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0152 --- Epoch 754 / 2000 - 754 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0178 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0063 --- Epoch 755 / 2000 - 755 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0021 --- Epoch 756 / 2000 - 756 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0056 --- Epoch 757 / 2000 - 757 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0041 --- Epoch 758 / 2000 - 758 epochs total Iteration 0, loss = 0.0302 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0024 --- Epoch 759 / 2000 - 759 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0066 --- Epoch 760 / 2000 - 760 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0017 Iteration 80, 
loss = 0.0063 --- Epoch 761 / 2000 - 761 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0042 --- Epoch 762 / 2000 - 762 epochs total Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0042 --- Epoch 763 / 2000 - 763 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0028 --- Epoch 764 / 2000 - 764 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0019 --- Epoch 765 / 2000 - 765 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0112 --- Epoch 766 / 2000 - 766 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0034 --- Epoch 767 / 2000 - 767 epochs total Iteration 0, loss = 0.0235 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0026 --- Epoch 768 / 2000 - 768 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0067 --- Epoch 769 / 2000 - 769 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0073 --- Epoch 770 / 2000 - 770 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0014 --- Epoch 771 / 2000 - 771 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0035 --- Epoch 772 / 
2000 - 772 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0034 --- Epoch 773 / 2000 - 773 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0030 --- Epoch 774 / 2000 - 774 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0247 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0018 --- Epoch 775 / 2000 - 775 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0042 --- Epoch 776 / 2000 - 776 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0077 --- Epoch 777 / 2000 - 777 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0017 --- Epoch 778 / 2000 - 778 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0179 --- Epoch 779 / 2000 - 779 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0202 --- Epoch 780 / 2000 - 780 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0218 Iteration 80, loss = 0.0078 --- Epoch 781 / 2000 - 781 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0035 --- Epoch 782 / 2000 - 782 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0020 --- Epoch 783 / 2000 - 783 epochs total 
Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0020 --- Epoch 784 / 2000 - 784 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0042 --- Epoch 785 / 2000 - 785 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0062 --- Epoch 786 / 2000 - 786 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0026 --- Epoch 787 / 2000 - 787 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0067 --- Epoch 788 / 2000 - 788 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0080 --- Epoch 789 / 2000 - 789 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0058 --- Epoch 790 / 2000 - 790 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0073 --- Epoch 791 / 2000 - 791 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0067 --- Epoch 792 / 2000 - 792 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0074 --- Epoch 793 / 2000 - 793 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0011 --- Epoch 794 / 2000 - 794 epochs total Iteration 0, loss = 0.0016 
Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0040 --- Epoch 795 / 2000 - 795 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0063 --- Epoch 796 / 2000 - 796 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0186 --- Epoch 797 / 2000 - 797 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0049 --- Epoch 798 / 2000 - 798 epochs total Iteration 0, loss = 0.0136 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0045 --- Epoch 799 / 2000 - 799 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0152 --- Epoch 800 / 2000 - 800 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0033 --- Epoch 801 / 2000 - 801 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0037 --- Epoch 802 / 2000 - 802 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0045 --- Epoch 803 / 2000 - 803 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0068 --- Epoch 804 / 2000 - 804 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0071 --- Epoch 805 / 2000 - 805 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0165 
Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0075 --- Epoch 806 / 2000 - 806 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0051 --- Epoch 807 / 2000 - 807 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0019 --- Epoch 808 / 2000 - 808 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0122 --- Epoch 809 / 2000 - 809 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0098 --- Epoch 810 / 2000 - 810 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0051 --- Epoch 811 / 2000 - 811 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0053 --- Epoch 812 / 2000 - 812 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0071 --- Epoch 813 / 2000 - 813 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0063 --- Epoch 814 / 2000 - 814 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0031 --- Epoch 815 / 2000 - 815 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0020 --- Epoch 816 / 2000 - 816 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0030 
Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0062 --- Epoch 817 / 2000 - 817 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0087 --- Epoch 818 / 2000 - 818 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0201 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0053 --- Epoch 819 / 2000 - 819 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0031 --- Epoch 820 / 2000 - 820 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0031 --- Epoch 821 / 2000 - 821 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0048 --- Epoch 822 / 2000 - 822 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0027 --- Epoch 823 / 2000 - 823 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0067 --- Epoch 824 / 2000 - 824 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0047 --- Epoch 825 / 2000 - 825 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0113 --- Epoch 826 / 2000 - 826 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0030 --- Epoch 827 / 2000 - 827 epochs total Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0008 
Iteration 80, loss = 0.0098 --- Epoch 828 / 2000 - 828 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0602 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0048 --- Epoch 829 / 2000 - 829 epochs total Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0070 --- Epoch 830 / 2000 - 830 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0059 --- Epoch 831 / 2000 - 831 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0144 Iteration 80, loss = 0.0093 --- Epoch 832 / 2000 - 832 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0113 --- Epoch 833 / 2000 - 833 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0183 Iteration 60, loss = 0.0216 Iteration 80, loss = 0.0108 --- Epoch 834 / 2000 - 834 epochs total Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0025 --- Epoch 835 / 2000 - 835 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0047 --- Epoch 836 / 2000 - 836 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0045 --- Epoch 837 / 2000 - 837 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0081 --- Epoch 838 / 2000 - 838 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0062 
--- Epoch 839 / 2000 - 839 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0033 --- Epoch 840 / 2000 - 840 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0020 --- Epoch 841 / 2000 - 841 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0022 --- Epoch 842 / 2000 - 842 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0071 --- Epoch 843 / 2000 - 843 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0204 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0029 --- Epoch 844 / 2000 - 844 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0028 --- Epoch 845 / 2000 - 845 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0017 --- Epoch 846 / 2000 - 846 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0145 --- Epoch 847 / 2000 - 847 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0023 --- Epoch 848 / 2000 - 848 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0032 --- Epoch 849 / 2000 - 849 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0049 --- Epoch 850 / 2000 - 850 
epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0035 --- Epoch 851 / 2000 - 851 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0138 --- Epoch 852 / 2000 - 852 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0054 --- Epoch 853 / 2000 - 853 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0035 --- Epoch 854 / 2000 - 854 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0034 --- Epoch 855 / 2000 - 855 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0108 --- Epoch 856 / 2000 - 856 epochs total Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0036 --- Epoch 857 / 2000 - 857 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0061 --- Epoch 858 / 2000 - 858 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0070 --- Epoch 859 / 2000 - 859 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0034 --- Epoch 860 / 2000 - 860 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0018 --- Epoch 861 / 2000 - 861 epochs total Iteration 0, loss 
= 0.0062 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0095 --- Epoch 862 / 2000 - 862 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0045 --- Epoch 863 / 2000 - 863 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0050 --- Epoch 864 / 2000 - 864 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0048 --- Epoch 865 / 2000 - 865 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0085 --- Epoch 866 / 2000 - 866 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0077 --- Epoch 867 / 2000 - 867 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0022 --- Epoch 868 / 2000 - 868 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0204 Iteration 80, loss = 0.0031 --- Epoch 869 / 2000 - 869 epochs total Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0230 --- Epoch 870 / 2000 - 870 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0033 --- Epoch 871 / 2000 - 871 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0014 --- Epoch 872 / 2000 - 872 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 
0.0054 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0011 --- Epoch 873 / 2000 - 873 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0030 --- Epoch 874 / 2000 - 874 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0019 --- Epoch 875 / 2000 - 875 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0053 --- Epoch 876 / 2000 - 876 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0020 --- Epoch 877 / 2000 - 877 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0069 --- Epoch 878 / 2000 - 878 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0018 --- Epoch 879 / 2000 - 879 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0228 --- Epoch 880 / 2000 - 880 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0163 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0016 --- Epoch 881 / 2000 - 881 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0763 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0064 --- Epoch 882 / 2000 - 882 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0024 --- Epoch 883 / 2000 - 883 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0059 Iteration 40, loss = 
0.0014 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0120 --- Epoch 884 / 2000 - 884 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0083 --- Epoch 885 / 2000 - 885 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0085 --- Epoch 886 / 2000 - 886 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0053 --- Epoch 887 / 2000 - 887 epochs total Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0015 --- Epoch 888 / 2000 - 888 epochs total Iteration 0, loss = 0.0265 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0082 --- Epoch 889 / 2000 - 889 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0272 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0108 --- Epoch 890 / 2000 - 890 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0013 --- Epoch 891 / 2000 - 891 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0029 --- Epoch 892 / 2000 - 892 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0178 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0042 --- Epoch 893 / 2000 - 893 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0030 --- Epoch 894 / 2000 - 894 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0019 Iteration 60, loss = 
0.0062 Iteration 80, loss = 0.0031 --- Epoch 895 / 2000 - 895 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0160 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0025 --- Epoch 896 / 2000 - 896 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0044 --- Epoch 897 / 2000 - 897 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0069 --- Epoch 898 / 2000 - 898 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0039 --- Epoch 899 / 2000 - 899 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0016 --- Epoch 900 / 2000 - 900 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0035 --- Epoch 901 / 2000 - 901 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0014 --- Epoch 902 / 2000 - 902 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0049 --- Epoch 903 / 2000 - 903 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0041 --- Epoch 904 / 2000 - 904 epochs total Iteration 0, loss = 0.0245 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0249 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0033 --- Epoch 905 / 2000 - 905 epochs total Iteration 0, loss = 0.0182 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0094 Iteration 80, loss = 
0.0156 --- Epoch 906 / 2000 - 906 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0033 --- Epoch 907 / 2000 - 907 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0021 --- Epoch 908 / 2000 - 908 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0153 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0020 --- Epoch 909 / 2000 - 909 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0018 --- Epoch 910 / 2000 - 910 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0017 --- Epoch 911 / 2000 - 911 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0039 --- Epoch 912 / 2000 - 912 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0042 --- Epoch 913 / 2000 - 913 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0032 --- Epoch 914 / 2000 - 914 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0060 --- Epoch 915 / 2000 - 915 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0037 --- Epoch 916 / 2000 - 916 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0057 --- Epoch 917 / 2000 - 
917 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0036 --- Epoch 918 / 2000 - 918 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0124 --- Epoch 919 / 2000 - 919 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0183 Iteration 80, loss = 0.0018 --- Epoch 920 / 2000 - 920 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0029 --- Epoch 921 / 2000 - 921 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0066 --- Epoch 922 / 2000 - 922 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0018 --- Epoch 923 / 2000 - 923 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0012 --- Epoch 924 / 2000 - 924 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0102 --- Epoch 925 / 2000 - 925 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0040 --- Epoch 926 / 2000 - 926 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0050 --- Epoch 927 / 2000 - 927 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0100 --- Epoch 928 / 2000 - 928 epochs total Iteration 0, 
loss = 0.0039 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0035 --- Epoch 929 / 2000 - 929 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0031 --- Epoch 930 / 2000 - 930 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0015 --- Epoch 931 / 2000 - 931 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0091 --- Epoch 932 / 2000 - 932 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0024 --- Epoch 933 / 2000 - 933 epochs total Iteration 0, loss = 0.0201 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0039 --- Epoch 934 / 2000 - 934 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0131 --- Epoch 935 / 2000 - 935 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0023 --- Epoch 936 / 2000 - 936 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0031 --- Epoch 937 / 2000 - 937 epochs total Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0095 --- Epoch 938 / 2000 - 938 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0028 --- Epoch 939 / 2000 - 939 epochs total Iteration 0, loss = 0.0051 Iteration 20, 
loss = 0.0037 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0016 --- Epoch 940 / 2000 - 940 epochs total Iteration 0, loss = 0.0186 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0013 --- Epoch 941 / 2000 - 941 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0049 --- Epoch 942 / 2000 - 942 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0024 --- Epoch 943 / 2000 - 943 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0085 --- Epoch 944 / 2000 - 944 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0325 Iteration 80, loss = 0.0051 --- Epoch 945 / 2000 - 945 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0053 --- Epoch 946 / 2000 - 946 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0231 Iteration 80, loss = 0.0047 --- Epoch 947 / 2000 - 947 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0164 --- Epoch 948 / 2000 - 948 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0012 --- Epoch 949 / 2000 - 949 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0041 --- Epoch 950 / 2000 - 950 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0063 Iteration 40, 
loss = 0.0072 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0041 --- Epoch 951 / 2000 - 951 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0029 --- Epoch 952 / 2000 - 952 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0190 --- Epoch 953 / 2000 - 953 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0091 --- Epoch 954 / 2000 - 954 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0033 --- Epoch 955 / 2000 - 955 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0008 --- Epoch 956 / 2000 - 956 epochs total Iteration 0, loss = 0.0310 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0037 --- Epoch 957 / 2000 - 957 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0033 --- Epoch 958 / 2000 - 958 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0050 --- Epoch 959 / 2000 - 959 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0059 --- Epoch 960 / 2000 - 960 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0029 --- Epoch 961 / 2000 - 961 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0175 Iteration 60, 
loss = 0.0017 Iteration 80, loss = 0.0015 --- Epoch 962 / 2000 - 962 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0021 --- Epoch 963 / 2000 - 963 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0035 --- Epoch 964 / 2000 - 964 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0019 --- Epoch 965 / 2000 - 965 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0028 --- Epoch 966 / 2000 - 966 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0071 --- Epoch 967 / 2000 - 967 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0022 --- Epoch 968 / 2000 - 968 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0013 --- Epoch 969 / 2000 - 969 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0021 --- Epoch 970 / 2000 - 970 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0233 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0037 --- Epoch 971 / 2000 - 971 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0020 --- Epoch 972 / 2000 - 972 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0081 Iteration 80, 
loss = 0.0033 --- Epoch 973 / 2000 - 973 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0077 --- Epoch 974 / 2000 - 974 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0287 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0027 --- Epoch 975 / 2000 - 975 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0194 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0153 --- Epoch 976 / 2000 - 976 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0026 --- Epoch 977 / 2000 - 977 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0063 --- Epoch 978 / 2000 - 978 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0298 --- Epoch 979 / 2000 - 979 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0090 --- Epoch 980 / 2000 - 980 epochs total Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0233 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0028 --- Epoch 981 / 2000 - 981 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0014 --- Epoch 982 / 2000 - 982 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0051 --- Epoch 983 / 2000 - 983 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0012 --- Epoch 984 / 
2000 - 984 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0014 --- Epoch 985 / 2000 - 985 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0226 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0027 --- Epoch 986 / 2000 - 986 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0013 --- Epoch 987 / 2000 - 987 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0051 --- Epoch 988 / 2000 - 988 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0087 --- Epoch 989 / 2000 - 989 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0020 --- Epoch 990 / 2000 - 990 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0053 --- Epoch 991 / 2000 - 991 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0182 --- Epoch 992 / 2000 - 992 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0027 --- Epoch 993 / 2000 - 993 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0017 --- Epoch 994 / 2000 - 994 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0250 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0019 --- Epoch 995 / 2000 - 995 epochs total 
Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0012 --- Epoch 996 / 2000 - 996 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0044 --- Epoch 997 / 2000 - 997 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0054 --- Epoch 998 / 2000 - 998 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0032 --- Epoch 999 / 2000 - 999 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0098 --- Epoch 1000 / 2000 - 1000 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0112 --- Epoch 1001 / 2000 - 1001 epochs total Iteration 0, loss = 0.0215 Iteration 20, loss = 0.0017
--------------------------------------------------------------------------- KeyboardInterrupt Traceback (most recent call last) <ipython-input-117-e83bcd8f9b5f> in <module> ----> 1 train(model9, optimizer, epochs=2000, x_train=data["X_train_ship"], y_train=data["y_train_ship"], criterion=nn.MSELoss()) <ipython-input-18-95dee9c67ab2> in train(model, optimizer, epochs, x_train, y_train, criterion) 28 y = y_batch[t].to(device=device, dtype=dtype) 29 ---> 30 scores = model(x) 31 32 loss = criterion(scores.view(-1), y.view(-1)) /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs) 720 result = self._slow_forward(*input, **kwargs) 721 else: --> 722 result = self.forward(*input, **kwargs) 723 for hook in itertools.chain( 724 _global_forward_hooks.values(), <ipython-input-24-48b049d402e0> in forward(self, x) 25 26 # Encoder ---> 27 scores = F.relu(self.batchnorm1(self.conv1(x))) 28 scores = F.relu(self.batchnorm2(self.conv2(scores))) 29 scores = F.relu(self.batchnorm3(self.conv3(scores))) /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs) 720 result = self._slow_forward(*input, **kwargs) 721 else: --> 722 result = self.forward(*input, **kwargs) 723 for hook in itertools.chain( 724 _global_forward_hooks.values(), /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/conv.py in forward(self, input) 417 418 def forward(self, input: Tensor) -> Tensor: --> 419 return self._conv_forward(input, self.weight) 420 421 class Conv3d(_ConvNd): /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/conv.py in _conv_forward(self, input, weight) 414 _pair(0), self.dilation, self.groups) 415 return F.conv2d(input, weight, self.bias, self.stride, --> 416 self.padding, self.dilation, self.groups) 417 418 def forward(self, input: Tensor) -> Tensor: KeyboardInterrupt:
# Score model9 on the ship test arrays using a mean-squared-error criterion.
testModel(
    model9,
    x_test=data["X_test_ship"],
    y_test=data["y_test_ship"],
    criterion=nn.MSELoss(),
)
# Frog experiment: construct a new ConvNet4 and optimise it with plain SGD
# against a mean-squared-error objective for up to 419 epochs.
learning_rate = 0.01
model11 = ConvNet4()
optimizer = optim.SGD(
    model11.parameters(),
    lr=learning_rate,
)
train(
    model11,
    optimizer,
    epochs=419,
    x_train=data["X_train_frog"],
    y_train=data["y_train_frog"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 419 - 2582 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0044 --- Epoch 2 / 419 - 2583 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0045 --- Epoch 3 / 419 - 2584 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0018 --- Epoch 4 / 419 - 2585 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0158 Iteration 80, loss = 0.0029 --- Epoch 5 / 419 - 2586 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0019 --- Epoch 6 / 419 - 2587 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0066 --- Epoch 7 / 419 - 2588 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0035 --- Epoch 8 / 419 - 2589 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0025 --- Epoch 9 / 419 - 2590 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0027 --- Epoch 10 / 419 - 2591 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0013 --- Epoch 11 / 419 - 2592 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0020 --- Epoch 12 / 419 - 2593 epochs total Iteration 
0, loss = 0.0020 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0032 --- Epoch 13 / 419 - 2594 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0065 --- Epoch 14 / 419 - 2595 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0040 --- Epoch 15 / 419 - 2596 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0019 --- Epoch 16 / 419 - 2597 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0033 --- Epoch 17 / 419 - 2598 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0070 --- Epoch 18 / 419 - 2599 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0041 --- Epoch 19 / 419 - 2600 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0026 --- Epoch 20 / 419 - 2601 epochs total Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0023 --- Epoch 21 / 419 - 2602 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0067 --- Epoch 22 / 419 - 2603 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0070 --- Epoch 23 / 419 - 2604 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 
0.0208 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0016 --- Epoch 24 / 419 - 2605 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0038 --- Epoch 25 / 419 - 2606 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0044 --- Epoch 26 / 419 - 2607 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0020 --- Epoch 27 / 419 - 2608 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0015 --- Epoch 28 / 419 - 2609 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0057 --- Epoch 29 / 419 - 2610 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0029 --- Epoch 30 / 419 - 2611 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0267 --- Epoch 31 / 419 - 2612 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0092 --- Epoch 32 / 419 - 2613 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0033 --- Epoch 33 / 419 - 2614 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0043 --- Epoch 34 / 419 - 2615 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0014 
Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0030 --- Epoch 35 / 419 - 2616 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0033 --- Epoch 36 / 419 - 2617 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0016 --- Epoch 37 / 419 - 2618 epochs total Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0506 Iteration 80, loss = 0.0043 --- Epoch 38 / 419 - 2619 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0068 --- Epoch 39 / 419 - 2620 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0036 --- Epoch 40 / 419 - 2621 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0021 --- Epoch 41 / 419 - 2622 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0024 --- Epoch 42 / 419 - 2623 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0022 --- Epoch 43 / 419 - 2624 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0181 --- Epoch 44 / 419 - 2625 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0040 --- Epoch 45 / 419 - 2626 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0041 Iteration 80, 
loss = 0.0015 --- Epoch 46 / 419 - 2627 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0055 --- Epoch 47 / 419 - 2628 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0061 --- Epoch 48 / 419 - 2629 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0063
--------------------------------------------------------------------------- KeyboardInterrupt Traceback (most recent call last) <ipython-input-130-3d0cbeabd450> in <module> ----> 1 train(model11, optimizer, epochs=419, x_train=data["X_train_frog"], y_train=data["y_train_frog"], criterion=nn.MSELoss()) <ipython-input-18-95dee9c67ab2> in train(model, optimizer, epochs, x_train, y_train, criterion) 28 y = y_batch[t].to(device=device, dtype=dtype) 29 ---> 30 scores = model(x) 31 32 loss = criterion(scores.view(-1), y.view(-1)) /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs) 720 result = self._slow_forward(*input, **kwargs) 721 else: --> 722 result = self.forward(*input, **kwargs) 723 for hook in itertools.chain( 724 _global_forward_hooks.values(), <ipython-input-24-48b049d402e0> in forward(self, x) 26 # Encoder 27 scores = F.relu(self.batchnorm1(self.conv1(x))) ---> 28 scores = F.relu(self.batchnorm2(self.conv2(scores))) 29 scores = F.relu(self.batchnorm3(self.conv3(scores))) 30 scores = F.relu(self.batchnorm4(self.conv4(scores))) /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/module.py in _call_impl(self, *input, **kwargs) 720 result = self._slow_forward(*input, **kwargs) 721 else: --> 722 result = self.forward(*input, **kwargs) 723 for hook in itertools.chain( 724 _global_forward_hooks.values(), /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/modules/batchnorm.py in forward(self, input) 134 self.running_mean if not self.training or self.track_running_stats else None, 135 self.running_var if not self.training or self.track_running_stats else None, --> 136 self.weight, self.bias, bn_training, exponential_average_factor, self.eps) 137 138 /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/nn/functional.py in batch_norm(input, running_mean, running_var, weight, bias, training, momentum, eps) 2014 return torch.batch_norm( 2015 input, weight, bias, 
running_mean, running_var, -> 2016 training, momentum, eps, torch.backends.cudnn.enabled 2017 ) 2018 KeyboardInterrupt:
# Score model11 on the frog test arrays.
# NOTE(review): the criterion here is nn.L1Loss(), while model11 is trained
# with nn.MSELoss() and the ship evaluation uses nn.MSELoss() -- confirm the
# different metric is intentional before comparing results across classes.
testModel(
    model11,
    x_test=data["X_test_frog"],
    y_test=data["y_test_frog"],
    criterion=nn.L1Loss(),
)
# Horse experiment: construct a new ConvNet4 and optimise it with plain SGD
# against a mean-squared-error objective for up to 1506 epochs.
learning_rate = 0.01
model12 = ConvNet4()
optimizer = optim.SGD(
    model12.parameters(),
    lr=learning_rate,
)
train(
    model12,
    optimizer,
    epochs=1506,
    x_train=data["X_train_horse"],
    y_train=data["y_train_horse"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 1506 - 1495 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0085 --- Epoch 2 / 1506 - 1496 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0037 --- Epoch 3 / 1506 - 1497 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0053 --- Epoch 4 / 1506 - 1498 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0053 --- Epoch 5 / 1506 - 1499 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0034 --- Epoch 6 / 1506 - 1500 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0033 --- Epoch 7 / 1506 - 1501 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0041 --- Epoch 8 / 1506 - 1502 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0042 --- Epoch 9 / 1506 - 1503 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0051 --- Epoch 10 / 1506 - 1504 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0025 --- Epoch 11 / 1506 - 1505 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0065 --- Epoch 12 / 1506 - 1506 epochs total 
Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0022 --- Epoch 13 / 1506 - 1507 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0027 --- Epoch 14 / 1506 - 1508 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0026 --- Epoch 15 / 1506 - 1509 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0080 --- Epoch 16 / 1506 - 1510 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0054 --- Epoch 17 / 1506 - 1511 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0030 --- Epoch 18 / 1506 - 1512 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0176 --- Epoch 19 / 1506 - 1513 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0054 --- Epoch 20 / 1506 - 1514 epochs total Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0027 --- Epoch 21 / 1506 - 1515 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0221 Iteration 80, loss = 0.0028 --- Epoch 22 / 1506 - 1516 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0093 --- Epoch 23 / 1506 - 1517 epochs total Iteration 0, loss = 0.0069 
Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0032 --- Epoch 24 / 1506 - 1518 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0339 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0041 --- Epoch 25 / 1506 - 1519 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0029 --- Epoch 26 / 1506 - 1520 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0028 --- Epoch 27 / 1506 - 1521 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0034 --- Epoch 28 / 1506 - 1522 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0068 --- Epoch 29 / 1506 - 1523 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0051 --- Epoch 30 / 1506 - 1524 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0031 --- Epoch 31 / 1506 - 1525 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0020 --- Epoch 32 / 1506 - 1526 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0066 --- Epoch 33 / 1506 - 1527 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0074 --- Epoch 34 / 1506 - 1528 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0052 
Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0035 --- Epoch 35 / 1506 - 1529 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0025 --- Epoch 36 / 1506 - 1530 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0050 --- Epoch 37 / 1506 - 1531 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0032 --- Epoch 38 / 1506 - 1532 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0034 --- Epoch 39 / 1506 - 1533 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0047 --- Epoch 40 / 1506 - 1534 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0141 --- Epoch 41 / 1506 - 1535 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0020 --- Epoch 42 / 1506 - 1536 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0036 --- Epoch 43 / 1506 - 1537 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0053 --- Epoch 44 / 1506 - 1538 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0077 --- Epoch 45 / 1506 - 1539 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0054 
Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0109 --- Epoch 46 / 1506 - 1540 epochs total Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0034 --- Epoch 47 / 1506 - 1541 epochs total Iteration 0, loss = 0.0194 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0026 --- Epoch 48 / 1506 - 1542 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0026 --- Epoch 49 / 1506 - 1543 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0025 --- Epoch 50 / 1506 - 1544 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0226 --- Epoch 51 / 1506 - 1545 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0097 --- Epoch 52 / 1506 - 1546 epochs total Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0039 --- Epoch 53 / 1506 - 1547 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0016 --- Epoch 54 / 1506 - 1548 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0061 --- Epoch 55 / 1506 - 1549 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0039 --- Epoch 56 / 1506 - 1550 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0021 
Iteration 80, loss = 0.0050 --- Epoch 57 / 1506 - 1551 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0088 --- Epoch 58 / 1506 - 1552 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0029 --- Epoch 59 / 1506 - 1553 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0064 --- Epoch 60 / 1506 - 1554 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0172 --- Epoch 61 / 1506 - 1555 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0069 --- Epoch 62 / 1506 - 1556 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0040 --- Epoch 63 / 1506 - 1557 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0046 --- Epoch 64 / 1506 - 1558 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0024 --- Epoch 65 / 1506 - 1559 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0022 --- Epoch 66 / 1506 - 1560 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0043 --- Epoch 67 / 1506 - 1561 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0086 
--- Epoch 68 / 1506 - 1562 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0039 --- Epoch 69 / 1506 - 1563 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0035 --- Epoch 70 / 1506 - 1564 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0017 --- Epoch 71 / 1506 - 1565 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0026 --- Epoch 72 / 1506 - 1566 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0038 --- Epoch 73 / 1506 - 1567 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0059 --- Epoch 74 / 1506 - 1568 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0026 --- Epoch 75 / 1506 - 1569 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0041 --- Epoch 76 / 1506 - 1570 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0028 --- Epoch 77 / 1506 - 1571 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0224 --- Epoch 78 / 1506 - 1572 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0059 --- Epoch 79 / 1506 - 1573 
epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0035 --- Epoch 80 / 1506 - 1574 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0070 --- Epoch 81 / 1506 - 1575 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0049 --- Epoch 82 / 1506 - 1576 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0021 --- Epoch 83 / 1506 - 1577 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0042 --- Epoch 84 / 1506 - 1578 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0035 --- Epoch 85 / 1506 - 1579 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0022 --- Epoch 86 / 1506 - 1580 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0097 --- Epoch 87 / 1506 - 1581 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0023 --- Epoch 88 / 1506 - 1582 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0019 --- Epoch 89 / 1506 - 1583 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0051 --- Epoch 90 / 1506 - 1584 epochs total Iteration 0, loss 
= 0.0033 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0027 --- Epoch 91 / 1506 - 1585 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0018 --- Epoch 92 / 1506 - 1586 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0052 --- Epoch 93 / 1506 - 1587 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0040 --- Epoch 94 / 1506 - 1588 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0037 --- Epoch 95 / 1506 - 1589 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0028 --- Epoch 96 / 1506 - 1590 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0044 --- Epoch 97 / 1506 - 1591 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0028 --- Epoch 98 / 1506 - 1592 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0028 --- Epoch 99 / 1506 - 1593 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0056 --- Epoch 100 / 1506 - 1594 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0022 --- Epoch 101 / 1506 - 1595 epochs total Iteration 0, loss = 0.0170 Iteration 20, loss 
= 0.0051 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0041 --- Epoch 102 / 1506 - 1596 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0062 --- Epoch 103 / 1506 - 1597 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0038 --- Epoch 104 / 1506 - 1598 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0056 --- Epoch 105 / 1506 - 1599 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0078 --- Epoch 106 / 1506 - 1600 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0047 --- Epoch 107 / 1506 - 1601 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0044 --- Epoch 108 / 1506 - 1602 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0031 --- Epoch 109 / 1506 - 1603 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0027 --- Epoch 110 / 1506 - 1604 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0037 --- Epoch 111 / 1506 - 1605 epochs total Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0017 --- Epoch 112 / 1506 - 1606 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0039 Iteration 
40, loss = 0.0339 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0078 --- Epoch 113 / 1506 - 1607 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0038 --- Epoch 114 / 1506 - 1608 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0049 --- Epoch 115 / 1506 - 1609 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0033 --- Epoch 116 / 1506 - 1610 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0022 --- Epoch 117 / 1506 - 1611 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0024 --- Epoch 118 / 1506 - 1612 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0083 --- Epoch 119 / 1506 - 1613 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0030 --- Epoch 120 / 1506 - 1614 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0033 --- Epoch 121 / 1506 - 1615 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0033 --- Epoch 122 / 1506 - 1616 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0036 --- Epoch 123 / 1506 - 1617 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0027 
Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0059 --- Epoch 124 / 1506 - 1618 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0117 --- Epoch 125 / 1506 - 1619 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0148 --- Epoch 126 / 1506 - 1620 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0034 --- Epoch 127 / 1506 - 1621 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0060 --- Epoch 128 / 1506 - 1622 epochs total Iteration 0, loss = 0.0223 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0026 --- Epoch 129 / 1506 - 1623 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0031 --- Epoch 130 / 1506 - 1624 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0028 --- Epoch 131 / 1506 - 1625 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0066 --- Epoch 132 / 1506 - 1626 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0027 --- Epoch 133 / 1506 - 1627 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0060 --- Epoch 134 / 1506 - 1628 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0076 Iteration 60, loss 
= 0.0041 Iteration 80, loss = 0.0041 --- Epoch 135 / 1506 - 1629 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0028 --- Epoch 136 / 1506 - 1630 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0052 --- Epoch 137 / 1506 - 1631 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0049 --- Epoch 138 / 1506 - 1632 epochs total Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0154 --- Epoch 139 / 1506 - 1633 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0032 --- Epoch 140 / 1506 - 1634 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0023 --- Epoch 141 / 1506 - 1635 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0058 --- Epoch 142 / 1506 - 1636 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0024 --- Epoch 143 / 1506 - 1637 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0024 --- Epoch 144 / 1506 - 1638 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0011 --- Epoch 145 / 1506 - 1639 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0032 Iteration 
80, loss = 0.0019 --- Epoch 146 / 1506 - 1640 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0040 --- Epoch 147 / 1506 - 1641 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0057 --- Epoch 148 / 1506 - 1642 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0069 --- Epoch 149 / 1506 - 1643 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0039 --- Epoch 150 / 1506 - 1644 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0035 --- Epoch 151 / 1506 - 1645 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0124 --- Epoch 152 / 1506 - 1646 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0018 --- Epoch 153 / 1506 - 1647 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0042 --- Epoch 154 / 1506 - 1648 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0044 --- Epoch 155 / 1506 - 1649 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0032 --- Epoch 156 / 1506 - 1650 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0037 
--- Epoch 157 / 1506 - 1651 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0043 --- Epoch 158 / 1506 - 1652 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0049 --- Epoch 159 / 1506 - 1653 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0038 --- Epoch 160 / 1506 - 1654 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0035 --- Epoch 161 / 1506 - 1655 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0040 --- Epoch 162 / 1506 - 1656 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0088 --- Epoch 163 / 1506 - 1657 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0064 --- Epoch 164 / 1506 - 1658 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0035 --- Epoch 165 / 1506 - 1659 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0080 --- Epoch 166 / 1506 - 1660 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0032 --- Epoch 167 / 1506 - 1661 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0021 --- Epoch 168 / 
1506 - 1662 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0052 --- Epoch 169 / 1506 - 1663 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0053 --- Epoch 170 / 1506 - 1664 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0090 --- Epoch 171 / 1506 - 1665 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0028 --- Epoch 172 / 1506 - 1666 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0039 --- Epoch 173 / 1506 - 1667 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0038 --- Epoch 174 / 1506 - 1668 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0082 --- Epoch 175 / 1506 - 1669 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0044 --- Epoch 176 / 1506 - 1670 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0191 --- Epoch 177 / 1506 - 1671 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0020 --- Epoch 178 / 1506 - 1672 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0026 --- Epoch 179 / 1506 - 1673 epochs 
total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0022 --- Epoch 180 / 1506 - 1674 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0053 --- Epoch 181 / 1506 - 1675 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0024 --- Epoch 182 / 1506 - 1676 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0035 --- Epoch 183 / 1506 - 1677 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0049 --- Epoch 184 / 1506 - 1678 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0069 --- Epoch 185 / 1506 - 1679 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0031 --- Epoch 186 / 1506 - 1680 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0050 --- Epoch 187 / 1506 - 1681 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0041 --- Epoch 188 / 1506 - 1682 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0044 --- Epoch 189 / 1506 - 1683 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0127 --- Epoch 190 / 1506 - 1684 epochs total Iteration 0, 
loss = 0.0060 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0111 --- Epoch 191 / 1506 - 1685 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0037 --- Epoch 192 / 1506 - 1686 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0090 --- Epoch 193 / 1506 - 1687 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0026 --- Epoch 194 / 1506 - 1688 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0024 --- Epoch 195 / 1506 - 1689 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0037 --- Epoch 196 / 1506 - 1690 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0026 --- Epoch 197 / 1506 - 1691 epochs total Iteration 0, loss = 0.0284 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0036 --- Epoch 198 / 1506 - 1692 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0036 --- Epoch 199 / 1506 - 1693 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0020 --- Epoch 200 / 1506 - 1694 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0033 --- Epoch 201 / 1506 - 1695 epochs total Iteration 0, loss = 0.0048 
Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0040 --- Epoch 202 / 1506 - 1696 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0040 --- Epoch 203 / 1506 - 1697 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0019 --- Epoch 204 / 1506 - 1698 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0049 --- Epoch 205 / 1506 - 1699 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0042 --- Epoch 206 / 1506 - 1700 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0053 --- Epoch 207 / 1506 - 1701 epochs total Iteration 0, loss = 0.0284 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0042 --- Epoch 208 / 1506 - 1702 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0042 --- Epoch 209 / 1506 - 1703 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0034 --- Epoch 210 / 1506 - 1704 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0027 --- Epoch 211 / 1506 - 1705 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0044 --- Epoch 212 / 1506 - 1706 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss 
= 0.0028 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0124 --- Epoch 213 / 1506 - 1707 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0032 --- Epoch 214 / 1506 - 1708 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0098 --- Epoch 215 / 1506 - 1709 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0025 --- Epoch 216 / 1506 - 1710 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0032 --- Epoch 217 / 1506 - 1711 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0032 --- Epoch 218 / 1506 - 1712 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0025 --- Epoch 219 / 1506 - 1713 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0010 --- Epoch 220 / 1506 - 1714 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0031 --- Epoch 221 / 1506 - 1715 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0047 --- Epoch 222 / 1506 - 1716 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0042 --- Epoch 223 / 1506 - 1717 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0021 Iteration 
40, loss = 0.0041 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0060 --- Epoch 224 / 1506 - 1718 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0053 --- Epoch 225 / 1506 - 1719 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0044 --- Epoch 226 / 1506 - 1720 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0076 --- Epoch 227 / 1506 - 1721 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0068 --- Epoch 228 / 1506 - 1722 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0032 --- Epoch 229 / 1506 - 1723 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0176 --- Epoch 230 / 1506 - 1724 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0030 --- Epoch 231 / 1506 - 1725 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0020 --- Epoch 232 / 1506 - 1726 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0061 --- Epoch 233 / 1506 - 1727 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0037 --- Epoch 234 / 1506 - 1728 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0035 
Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0021 --- Epoch 235 / 1506 - 1729 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0091 --- Epoch 236 / 1506 - 1730 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0064 --- Epoch 237 / 1506 - 1731 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0107 --- Epoch 238 / 1506 - 1732 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0098 --- Epoch 239 / 1506 - 1733 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0023 --- Epoch 240 / 1506 - 1734 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0024 --- Epoch 241 / 1506 - 1735 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0050 --- Epoch 242 / 1506 - 1736 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0086 --- Epoch 243 / 1506 - 1737 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0021 --- Epoch 244 / 1506 - 1738 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0099 --- Epoch 245 / 1506 - 1739 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0074 Iteration 60, loss 
= 0.0059 Iteration 80, loss = 0.0029 --- Epoch 246 / 1506 - 1740 epochs total Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0024 --- Epoch 247 / 1506 - 1741 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0042 --- Epoch 248 / 1506 - 1742 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0028 --- Epoch 249 / 1506 - 1743 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0138 --- Epoch 250 / 1506 - 1744 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0028 --- Epoch 251 / 1506 - 1745 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0079 --- Epoch 252 / 1506 - 1746 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0032 --- Epoch 253 / 1506 - 1747 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0043 --- Epoch 254 / 1506 - 1748 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0039 --- Epoch 255 / 1506 - 1749 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0066 --- Epoch 256 / 1506 - 1750 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0035 Iteration 
80, loss = 0.0021 --- Epoch 257 / 1506 - 1751 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0036 --- Epoch 258 / 1506 - 1752 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0057 --- Epoch 259 / 1506 - 1753 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0057 --- Epoch 260 / 1506 - 1754 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0054 --- Epoch 261 / 1506 - 1755 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0193 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0069 --- Epoch 262 / 1506 - 1756 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0061 --- Epoch 263 / 1506 - 1757 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0018 --- Epoch 264 / 1506 - 1758 epochs total Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0040 --- Epoch 265 / 1506 - 1759 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0024 --- Epoch 266 / 1506 - 1760 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0050 --- Epoch 267 / 1506 - 1761 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0049 
--- Epoch 268 / 1506 - 1762 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0023 --- Epoch 269 / 1506 - 1763 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0035 --- Epoch 270 / 1506 - 1764 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0019 --- Epoch 271 / 1506 - 1765 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0039 --- Epoch 272 / 1506 - 1766 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0031 --- Epoch 273 / 1506 - 1767 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0046 --- Epoch 274 / 1506 - 1768 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0191 Iteration 80, loss = 0.0017 --- Epoch 275 / 1506 - 1769 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0034 --- Epoch 276 / 1506 - 1770 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0037 --- Epoch 277 / 1506 - 1771 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0254 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0023 --- Epoch 278 / 1506 - 1772 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0230 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0057 --- Epoch 279 / 
1506 - 1773 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0034 --- Epoch 280 / 1506 - 1774 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0041 --- Epoch 281 / 1506 - 1775 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0050 --- Epoch 282 / 1506 - 1776 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0028 --- Epoch 283 / 1506 - 1777 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0054 --- Epoch 284 / 1506 - 1778 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0040 --- Epoch 285 / 1506 - 1779 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0338 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0044 --- Epoch 286 / 1506 - 1780 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0011 --- Epoch 287 / 1506 - 1781 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0035 --- Epoch 288 / 1506 - 1782 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0059 --- Epoch 289 / 1506 - 1783 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0072 --- Epoch 290 / 1506 - 1784 epochs 
total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0089 --- Epoch 291 / 1506 - 1785 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0045 --- Epoch 292 / 1506 - 1786 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0179 --- Epoch 293 / 1506 - 1787 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0048 --- Epoch 294 / 1506 - 1788 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0040 --- Epoch 295 / 1506 - 1789 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0031 --- Epoch 296 / 1506 - 1790 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0024 --- Epoch 297 / 1506 - 1791 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0023 --- Epoch 298 / 1506 - 1792 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0053 --- Epoch 299 / 1506 - 1793 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0040 --- Epoch 300 / 1506 - 1794 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0028 --- Epoch 301 / 1506 - 1795 epochs total Iteration 0, 
loss = 0.0050 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0047 --- Epoch 302 / 1506 - 1796 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0055 --- Epoch 303 / 1506 - 1797 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0022 --- Epoch 304 / 1506 - 1798 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0034 --- Epoch 305 / 1506 - 1799 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0032 --- Epoch 306 / 1506 - 1800 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0020 --- Epoch 307 / 1506 - 1801 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0037 --- Epoch 308 / 1506 - 1802 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0031 --- Epoch 309 / 1506 - 1803 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0036 --- Epoch 310 / 1506 - 1804 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0028 --- Epoch 311 / 1506 - 1805 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0017 --- Epoch 312 / 1506 - 1806 epochs total Iteration 0, loss = 0.0143 
Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0024 --- Epoch 313 / 1506 - 1807 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0029 --- Epoch 314 / 1506 - 1808 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0042 --- Epoch 315 / 1506 - 1809 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0043 --- Epoch 316 / 1506 - 1810 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0044 --- Epoch 317 / 1506 - 1811 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0038 --- Epoch 318 / 1506 - 1812 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0040 --- Epoch 319 / 1506 - 1813 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0052 --- Epoch 320 / 1506 - 1814 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0036 --- Epoch 321 / 1506 - 1815 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0253 Iteration 80, loss = 0.0082 --- Epoch 322 / 1506 - 1816 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0068 --- Epoch 323 / 1506 - 1817 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss 
= 0.0031 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0020 --- Epoch 324 / 1506 - 1818 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0014 --- Epoch 325 / 1506 - 1819 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0032 --- Epoch 326 / 1506 - 1820 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0079 --- Epoch 327 / 1506 - 1821 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0024 --- Epoch 328 / 1506 - 1822 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0043 --- Epoch 329 / 1506 - 1823 epochs total Iteration 0, loss = 0.0284 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0024 --- Epoch 330 / 1506 - 1824 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0020 --- Epoch 331 / 1506 - 1825 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0052 --- Epoch 332 / 1506 - 1826 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0021 --- Epoch 333 / 1506 - 1827 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0027 --- Epoch 334 / 1506 - 1828 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0055 Iteration 
40, loss = 0.0049 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0032 --- Epoch 335 / 1506 - 1829 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0016 --- Epoch 336 / 1506 - 1830 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0044 --- Epoch 337 / 1506 - 1831 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0026 --- Epoch 338 / 1506 - 1832 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0035 --- Epoch 339 / 1506 - 1833 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0041 --- Epoch 340 / 1506 - 1834 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0022 --- Epoch 341 / 1506 - 1835 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0041 --- Epoch 342 / 1506 - 1836 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0029 --- Epoch 343 / 1506 - 1837 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0063 --- Epoch 344 / 1506 - 1838 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0033 --- Epoch 345 / 1506 - 1839 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0284 
Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0060 --- Epoch 346 / 1506 - 1840 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0061 --- Epoch 347 / 1506 - 1841 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0036 --- Epoch 348 / 1506 - 1842 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0114 --- Epoch 349 / 1506 - 1843 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0036 --- Epoch 350 / 1506 - 1844 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0311 --- Epoch 351 / 1506 - 1845 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0014 --- Epoch 352 / 1506 - 1846 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0108 --- Epoch 353 / 1506 - 1847 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0120 --- Epoch 354 / 1506 - 1848 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0060 --- Epoch 355 / 1506 - 1849 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0088 --- Epoch 356 / 1506 - 1850 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0033 Iteration 60, loss 
= 0.0152 Iteration 80, loss = 0.0029 --- Epoch 357 / 1506 - 1851 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0039 --- Epoch 358 / 1506 - 1852 epochs total Iteration 0, loss = 0.0281 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0024 --- Epoch 359 / 1506 - 1853 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0099 --- Epoch 360 / 1506 - 1854 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0018 --- Epoch 361 / 1506 - 1855 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0018 --- Epoch 362 / 1506 - 1856 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0027 --- Epoch 363 / 1506 - 1857 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0032 --- Epoch 364 / 1506 - 1858 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0037 --- Epoch 365 / 1506 - 1859 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0051 --- Epoch 366 / 1506 - 1860 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0080 --- Epoch 367 / 1506 - 1861 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0041 Iteration 
80, loss = 0.0046 --- Epoch 368 / 1506 - 1862 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0042 --- Epoch 369 / 1506 - 1863 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0025 --- Epoch 370 / 1506 - 1864 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0036 --- Epoch 371 / 1506 - 1865 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0072 --- Epoch 372 / 1506 - 1866 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0013 --- Epoch 373 / 1506 - 1867 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0015 --- Epoch 374 / 1506 - 1868 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0066 --- Epoch 375 / 1506 - 1869 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0024 --- Epoch 376 / 1506 - 1870 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0230 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0042 --- Epoch 377 / 1506 - 1871 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0021 --- Epoch 378 / 1506 - 1872 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0035 
--- Epoch 379 / 1506 - 1873 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0092 --- Epoch 380 / 1506 - 1874 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0104 --- Epoch 381 / 1506 - 1875 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0106 --- Epoch 382 / 1506 - 1876 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0026 --- Epoch 383 / 1506 - 1877 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0112 --- Epoch 384 / 1506 - 1878 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0048 --- Epoch 385 / 1506 - 1879 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0028 --- Epoch 386 / 1506 - 1880 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0088 --- Epoch 387 / 1506 - 1881 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0054 --- Epoch 388 / 1506 - 1882 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0050 --- Epoch 389 / 1506 - 1883 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0039 --- Epoch 390 / 
1506 - 1884 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0033 --- Epoch 391 / 1506 - 1885 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0049 --- Epoch 392 / 1506 - 1886 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0038 --- Epoch 393 / 1506 - 1887 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0230 Iteration 80, loss = 0.0020 --- Epoch 394 / 1506 - 1888 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0017 --- Epoch 395 / 1506 - 1889 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0021 --- Epoch 396 / 1506 - 1890 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0013 --- Epoch 397 / 1506 - 1891 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0051 --- Epoch 398 / 1506 - 1892 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0034 --- Epoch 399 / 1506 - 1893 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0020 --- Epoch 400 / 1506 - 1894 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0338 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0096 --- Epoch 401 / 1506 - 1895 epochs 
total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0026 --- Epoch 402 / 1506 - 1896 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0048 --- Epoch 403 / 1506 - 1897 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0045 --- Epoch 404 / 1506 - 1898 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0065 --- Epoch 405 / 1506 - 1899 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0031 --- Epoch 406 / 1506 - 1900 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0023 --- Epoch 407 / 1506 - 1901 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0080 --- Epoch 408 / 1506 - 1902 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0040 --- Epoch 409 / 1506 - 1903 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0079 --- Epoch 410 / 1506 - 1904 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0044 --- Epoch 411 / 1506 - 1905 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0027 --- Epoch 412 / 1506 - 1906 epochs total Iteration 0, 
loss = 0.0062 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0148 --- Epoch 413 / 1506 - 1907 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0059 --- Epoch 414 / 1506 - 1908 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0011 --- Epoch 415 / 1506 - 1909 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0021 --- Epoch 416 / 1506 - 1910 epochs total Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0030 --- Epoch 417 / 1506 - 1911 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0039 --- Epoch 418 / 1506 - 1912 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0044 --- Epoch 419 / 1506 - 1913 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0100 --- Epoch 420 / 1506 - 1914 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0092 --- Epoch 421 / 1506 - 1915 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0032 --- Epoch 422 / 1506 - 1916 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0023 --- Epoch 423 / 1506 - 1917 epochs total Iteration 0, loss = 0.0040 
Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0020 --- Epoch 424 / 1506 - 1918 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0019 --- Epoch 425 / 1506 - 1919 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0043 --- Epoch 426 / 1506 - 1920 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0032 --- Epoch 427 / 1506 - 1921 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0055 --- Epoch 428 / 1506 - 1922 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0040 --- Epoch 429 / 1506 - 1923 epochs total Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0035 --- Epoch 430 / 1506 - 1924 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0034 --- Epoch 431 / 1506 - 1925 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0030 --- Epoch 432 / 1506 - 1926 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0028 --- Epoch 433 / 1506 - 1927 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0030 --- Epoch 434 / 1506 - 1928 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss 
= 0.0061 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0038 --- Epoch 435 / 1506 - 1929 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0031 --- Epoch 436 / 1506 - 1930 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0026 --- Epoch 437 / 1506 - 1931 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0064 --- Epoch 438 / 1506 - 1932 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0034 --- Epoch 439 / 1506 - 1933 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0027 --- Epoch 440 / 1506 - 1934 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0028 --- Epoch 441 / 1506 - 1935 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0052 --- Epoch 442 / 1506 - 1936 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0032 --- Epoch 443 / 1506 - 1937 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0040 --- Epoch 444 / 1506 - 1938 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0059 --- Epoch 445 / 1506 - 1939 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0153 Iteration 
40, loss = 0.0060 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0030 --- Epoch 446 / 1506 - 1940 epochs total Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0061 --- Epoch 447 / 1506 - 1941 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0037 --- Epoch 448 / 1506 - 1942 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0064 --- Epoch 449 / 1506 - 1943 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0103 --- Epoch 450 / 1506 - 1944 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0067 --- Epoch 451 / 1506 - 1945 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0059 --- Epoch 452 / 1506 - 1946 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0027 --- Epoch 453 / 1506 - 1947 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0281 --- Epoch 454 / 1506 - 1948 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0043 --- Epoch 455 / 1506 - 1949 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0022 --- Epoch 456 / 1506 - 1950 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0046 
Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0020 --- Epoch 457 / 1506 - 1951 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0031 --- Epoch 458 / 1506 - 1952 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0021 --- Epoch 459 / 1506 - 1953 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0066 --- Epoch 460 / 1506 - 1954 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0045 --- Epoch 461 / 1506 - 1955 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0026 --- Epoch 462 / 1506 - 1956 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0032 --- Epoch 463 / 1506 - 1957 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0059 --- Epoch 464 / 1506 - 1958 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0041 --- Epoch 465 / 1506 - 1959 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0042 --- Epoch 466 / 1506 - 1960 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0193 --- Epoch 467 / 1506 - 1961 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0085 Iteration 60, loss 
= 0.0034 Iteration 80, loss = 0.0043 --- Epoch 468 / 1506 - 1962 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0033 --- Epoch 469 / 1506 - 1963 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0051 --- Epoch 470 / 1506 - 1964 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0057 --- Epoch 471 / 1506 - 1965 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0024 --- Epoch 472 / 1506 - 1966 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0111 --- Epoch 473 / 1506 - 1967 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0072 --- Epoch 474 / 1506 - 1968 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0017 --- Epoch 475 / 1506 - 1969 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0045 --- Epoch 476 / 1506 - 1970 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0018 --- Epoch 477 / 1506 - 1971 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0034 --- Epoch 478 / 1506 - 1972 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0051 Iteration 
80, loss = 0.0082 --- Epoch 479 / 1506 - 1973 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0024 --- Epoch 480 / 1506 - 1974 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0025 --- Epoch 481 / 1506 - 1975 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0038 --- Epoch 482 / 1506 - 1976 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0027 --- Epoch 483 / 1506 - 1977 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0028 --- Epoch 484 / 1506 - 1978 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0027 --- Epoch 485 / 1506 - 1979 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0092 --- Epoch 486 / 1506 - 1980 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0027 --- Epoch 487 / 1506 - 1981 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0029 --- Epoch 488 / 1506 - 1982 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0031 --- Epoch 489 / 1506 - 1983 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0018 
--- Epoch 490 / 1506 - 1984 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0067 --- Epoch 491 / 1506 - 1985 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0038 --- Epoch 492 / 1506 - 1986 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0040 --- Epoch 493 / 1506 - 1987 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0041 --- Epoch 494 / 1506 - 1988 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0014 --- Epoch 495 / 1506 - 1989 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0014 --- Epoch 496 / 1506 - 1990 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0063 --- Epoch 497 / 1506 - 1991 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0060 --- Epoch 498 / 1506 - 1992 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0076 --- Epoch 499 / 1506 - 1993 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0033 --- Epoch 500 / 1506 - 1994 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0062 --- Epoch 501 / 
1506 - 1995 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0036 --- Epoch 502 / 1506 - 1996 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0045 --- Epoch 503 / 1506 - 1997 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0068 --- Epoch 504 / 1506 - 1998 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0033 --- Epoch 505 / 1506 - 1999 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0035 --- Epoch 506 / 1506 - 2000 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0027 --- Epoch 507 / 1506 - 2001 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0023 --- Epoch 508 / 1506 - 2002 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0048 --- Epoch 509 / 1506 - 2003 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0202 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0068 --- Epoch 510 / 1506 - 2004 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0032 --- Epoch 511 / 1506 - 2005 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0036 --- Epoch 512 / 1506 - 2006 epochs 
total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0035 --- Epoch 513 / 1506 - 2007 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0020 --- Epoch 514 / 1506 - 2008 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0042 --- Epoch 515 / 1506 - 2009 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0033 --- Epoch 516 / 1506 - 2010 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0030 --- Epoch 517 / 1506 - 2011 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0023 --- Epoch 518 / 1506 - 2012 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0030 --- Epoch 519 / 1506 - 2013 epochs total Iteration 0, loss = 0.0184 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0070 --- Epoch 520 / 1506 - 2014 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0031 --- Epoch 521 / 1506 - 2015 epochs total Iteration 0, loss = 0.0718 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0033 --- Epoch 522 / 1506 - 2016 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0021 --- Epoch 523 / 1506 - 2017 epochs total Iteration 0, 
loss = 0.0018 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0102 --- Epoch 524 / 1506 - 2018 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0031 --- Epoch 525 / 1506 - 2019 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0097 --- Epoch 526 / 1506 - 2020 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0050 --- Epoch 527 / 1506 - 2021 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0020 --- Epoch 528 / 1506 - 2022 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0153 --- Epoch 529 / 1506 - 2023 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0035 --- Epoch 530 / 1506 - 2024 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0040 --- Epoch 531 / 1506 - 2025 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0041 --- Epoch 532 / 1506 - 2026 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0038 --- Epoch 533 / 1506 - 2027 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0041 --- Epoch 534 / 1506 - 2028 epochs total Iteration 0, loss = 0.0042 
Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0041 --- Epoch 535 / 1506 - 2029 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0061 --- Epoch 536 / 1506 - 2030 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0026 --- Epoch 537 / 1506 - 2031 epochs total Iteration 0, loss = 0.0136 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0043 --- Epoch 538 / 1506 - 2032 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0050 --- Epoch 539 / 1506 - 2033 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0032 --- Epoch 540 / 1506 - 2034 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0036 --- Epoch 541 / 1506 - 2035 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0035 --- Epoch 542 / 1506 - 2036 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0034 --- Epoch 543 / 1506 - 2037 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0034 --- Epoch 544 / 1506 - 2038 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0032 --- Epoch 545 / 1506 - 2039 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss 
= 0.0044 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0026 --- Epoch 546 / 1506 - 2040 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0081 --- Epoch 547 / 1506 - 2041 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0036 --- Epoch 548 / 1506 - 2042 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0024 --- Epoch 549 / 1506 - 2043 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0028 --- Epoch 550 / 1506 - 2044 epochs total Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0071 --- Epoch 551 / 1506 - 2045 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0065 --- Epoch 552 / 1506 - 2046 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0027 --- Epoch 553 / 1506 - 2047 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0051 --- Epoch 554 / 1506 - 2048 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0104 --- Epoch 555 / 1506 - 2049 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0057 --- Epoch 556 / 1506 - 2050 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0038 Iteration 
40, loss = 0.0026 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0023 --- Epoch 557 / 1506 - 2051 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0034 --- Epoch 558 / 1506 - 2052 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0024 --- Epoch 559 / 1506 - 2053 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0050 --- Epoch 560 / 1506 - 2054 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0054 --- Epoch 561 / 1506 - 2055 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0032 --- Epoch 562 / 1506 - 2056 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0059 --- Epoch 563 / 1506 - 2057 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0035 --- Epoch 564 / 1506 - 2058 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0052 --- Epoch 565 / 1506 - 2059 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0133 --- Epoch 566 / 1506 - 2060 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0034 --- Epoch 567 / 1506 - 2061 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0065 
Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0028 --- Epoch 568 / 1506 - 2062 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0048 --- Epoch 569 / 1506 - 2063 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0042 --- Epoch 570 / 1506 - 2064 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0082 --- Epoch 571 / 1506 - 2065 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0025 --- Epoch 572 / 1506 - 2066 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0049 --- Epoch 573 / 1506 - 2067 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0030 --- Epoch 574 / 1506 - 2068 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0067 --- Epoch 575 / 1506 - 2069 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0038 --- Epoch 576 / 1506 - 2070 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0028 --- Epoch 577 / 1506 - 2071 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0032 --- Epoch 578 / 1506 - 2072 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0066 Iteration 60, loss 
= 0.0038 Iteration 80, loss = 0.0035 --- Epoch 579 / 1506 - 2073 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0027 --- Epoch 580 / 1506 - 2074 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0036 --- Epoch 581 / 1506 - 2075 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0043 --- Epoch 582 / 1506 - 2076 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0025 --- Epoch 583 / 1506 - 2077 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0030 --- Epoch 584 / 1506 - 2078 epochs total Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0053 --- Epoch 585 / 1506 - 2079 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0054 --- Epoch 586 / 1506 - 2080 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0024 --- Epoch 587 / 1506 - 2081 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0025 --- Epoch 588 / 1506 - 2082 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0052 --- Epoch 589 / 1506 - 2083 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0019 Iteration 
80, loss = 0.0034 --- Epoch 590 / 1506 - 2084 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0027 --- Epoch 591 / 1506 - 2085 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0040 --- Epoch 592 / 1506 - 2086 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0065 --- Epoch 593 / 1506 - 2087 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0099 --- Epoch 594 / 1506 - 2088 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0033 --- Epoch 595 / 1506 - 2089 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0037 --- Epoch 596 / 1506 - 2090 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0031 --- Epoch 597 / 1506 - 2091 epochs total Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0042 --- Epoch 598 / 1506 - 2092 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0116 --- Epoch 599 / 1506 - 2093 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0023 --- Epoch 600 / 1506 - 2094 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0022 
--- Epoch 601 / 1506 - 2095 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0079 --- Epoch 602 / 1506 - 2096 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0052 --- Epoch 603 / 1506 - 2097 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0065 --- Epoch 604 / 1506 - 2098 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0150 --- Epoch 605 / 1506 - 2099 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0017 --- Epoch 606 / 1506 - 2100 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0019 --- Epoch 607 / 1506 - 2101 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0062 --- Epoch 608 / 1506 - 2102 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0045 --- Epoch 609 / 1506 - 2103 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0028 --- Epoch 610 / 1506 - 2104 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0034 --- Epoch 611 / 1506 - 2105 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0089 --- Epoch 612 / 
1506 - 2106 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0033 --- Epoch 613 / 1506 - 2107 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0026 --- Epoch 614 / 1506 - 2108 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0037 --- Epoch 615 / 1506 - 2109 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0018 --- Epoch 616 / 1506 - 2110 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0064 --- Epoch 617 / 1506 - 2111 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0030 --- Epoch 618 / 1506 - 2112 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0027 --- Epoch 619 / 1506 - 2113 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0063 --- Epoch 620 / 1506 - 2114 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0025 --- Epoch 621 / 1506 - 2115 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0108 --- Epoch 622 / 1506 - 2116 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0052 --- Epoch 623 / 1506 - 2117 epochs 
total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0049 --- Epoch 624 / 1506 - 2118 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0055 --- Epoch 625 / 1506 - 2119 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0040 --- Epoch 626 / 1506 - 2120 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0054 --- Epoch 627 / 1506 - 2121 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0027 --- Epoch 628 / 1506 - 2122 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0063 --- Epoch 629 / 1506 - 2123 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0034 --- Epoch 630 / 1506 - 2124 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0029 --- Epoch 631 / 1506 - 2125 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0041 --- Epoch 632 / 1506 - 2126 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0055 --- Epoch 633 / 1506 - 2127 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0053 --- Epoch 634 / 1506 - 2128 epochs total Iteration 0, 
loss = 0.0091 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0080 --- Epoch 635 / 1506 - 2129 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0040 --- Epoch 636 / 1506 - 2130 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0071 --- Epoch 637 / 1506 - 2131 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0037 --- Epoch 638 / 1506 - 2132 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0071 --- Epoch 639 / 1506 - 2133 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0036 --- Epoch 640 / 1506 - 2134 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0046 --- Epoch 641 / 1506 - 2135 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0052 --- Epoch 642 / 1506 - 2136 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0046 --- Epoch 643 / 1506 - 2137 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0029 --- Epoch 644 / 1506 - 2138 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0020 --- Epoch 645 / 1506 - 2139 epochs total Iteration 0, loss = 0.0019 
Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0017 --- Epoch 646 / 1506 - 2140 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0196 --- Epoch 647 / 1506 - 2141 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0030 --- Epoch 648 / 1506 - 2142 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0058 --- Epoch 649 / 1506 - 2143 epochs total Iteration 0, loss = 0.0223 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0050 --- Epoch 650 / 1506 - 2144 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0042 --- Epoch 651 / 1506 - 2145 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0035 --- Epoch 652 / 1506 - 2146 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0104 --- Epoch 653 / 1506 - 2147 epochs total Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0039 --- Epoch 654 / 1506 - 2148 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0015 --- Epoch 655 / 1506 - 2149 epochs total Iteration 0, loss = 0.0185 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0030 --- Epoch 656 / 1506 - 2150 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss 
= 0.0026 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0036 --- Epoch 657 / 1506 - 2151 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0103 --- Epoch 658 / 1506 - 2152 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0043 --- Epoch 659 / 1506 - 2153 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0217 --- Epoch 660 / 1506 - 2154 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0031 --- Epoch 661 / 1506 - 2155 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0039 --- Epoch 662 / 1506 - 2156 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0039 --- Epoch 663 / 1506 - 2157 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0032 --- Epoch 664 / 1506 - 2158 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0025 --- Epoch 665 / 1506 - 2159 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0041 --- Epoch 666 / 1506 - 2160 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0031 --- Epoch 667 / 1506 - 2161 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0025 Iteration 
40, loss = 0.0025 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0109 --- Epoch 668 / 1506 - 2162 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0032 --- Epoch 669 / 1506 - 2163 epochs total Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0052 --- Epoch 670 / 1506 - 2164 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0043 --- Epoch 671 / 1506 - 2165 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0059 --- Epoch 672 / 1506 - 2166 epochs total Iteration 0, loss = 0.0136 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0084 --- Epoch 673 / 1506 - 2167 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0048 --- Epoch 674 / 1506 - 2168 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0019 --- Epoch 675 / 1506 - 2169 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0046 --- Epoch 676 / 1506 - 2170 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0049 --- Epoch 677 / 1506 - 2171 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0040 --- Epoch 678 / 1506 - 2172 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0080 
Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0066 --- Epoch 679 / 1506 - 2173 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0064 --- Epoch 680 / 1506 - 2174 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0122 --- Epoch 681 / 1506 - 2175 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0062 --- Epoch 682 / 1506 - 2176 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0042 --- Epoch 683 / 1506 - 2177 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0055 --- Epoch 684 / 1506 - 2178 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0072 --- Epoch 685 / 1506 - 2179 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0026 --- Epoch 686 / 1506 - 2180 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0079 --- Epoch 687 / 1506 - 2181 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0122 --- Epoch 688 / 1506 - 2182 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0038 --- Epoch 689 / 1506 - 2183 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0037 Iteration 60, loss 
= 0.0032 Iteration 80, loss = 0.0034 --- Epoch 690 / 1506 - 2184 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0021 --- Epoch 691 / 1506 - 2185 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0253 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0061 --- Epoch 692 / 1506 - 2186 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0049 --- Epoch 693 / 1506 - 2187 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0074 --- Epoch 694 / 1506 - 2188 epochs total Iteration 0, loss = 0.0254 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0268 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0040 --- Epoch 695 / 1506 - 2189 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0024 --- Epoch 696 / 1506 - 2190 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0028 --- Epoch 697 / 1506 - 2191 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0033 --- Epoch 698 / 1506 - 2192 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0023 --- Epoch 699 / 1506 - 2193 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0078 --- Epoch 700 / 1506 - 2194 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0028 Iteration 
80, loss = 0.0045 --- Epoch 701 / 1506 - 2195 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0054 --- Epoch 702 / 1506 - 2196 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0019 --- Epoch 703 / 1506 - 2197 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0136 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0019 --- Epoch 704 / 1506 - 2198 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0014 --- Epoch 705 / 1506 - 2199 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0016 --- Epoch 706 / 1506 - 2200 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0049 --- Epoch 707 / 1506 - 2201 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0206 --- Epoch 708 / 1506 - 2202 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0036 --- Epoch 709 / 1506 - 2203 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0025 --- Epoch 710 / 1506 - 2204 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0069 --- Epoch 711 / 1506 - 2205 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0037 
--- Epoch 712 / 1506 - 2206 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0038 --- Epoch 713 / 1506 - 2207 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0041 --- Epoch 714 / 1506 - 2208 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0073 --- Epoch 715 / 1506 - 2209 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0064 --- Epoch 716 / 1506 - 2210 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0082 --- Epoch 717 / 1506 - 2211 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0029 --- Epoch 718 / 1506 - 2212 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0052 --- Epoch 719 / 1506 - 2213 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0178 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0036 --- Epoch 720 / 1506 - 2214 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0067 --- Epoch 721 / 1506 - 2215 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0031 --- Epoch 722 / 1506 - 2216 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0028 --- Epoch 723 / 
1506 - 2217 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0038 --- Epoch 724 / 1506 - 2218 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0059 --- Epoch 725 / 1506 - 2219 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0059 --- Epoch 726 / 1506 - 2220 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0013 --- Epoch 727 / 1506 - 2221 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0032 --- Epoch 728 / 1506 - 2222 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0082 --- Epoch 729 / 1506 - 2223 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0042 --- Epoch 730 / 1506 - 2224 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0036 --- Epoch 731 / 1506 - 2225 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0284 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0043 --- Epoch 732 / 1506 - 2226 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0035 --- Epoch 733 / 1506 - 2227 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0036 --- Epoch 734 / 1506 - 2228 epochs 
total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0027 --- Epoch 735 / 1506 - 2229 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0041 --- Epoch 736 / 1506 - 2230 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0064 --- Epoch 737 / 1506 - 2231 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0035 --- Epoch 738 / 1506 - 2232 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0041 --- Epoch 739 / 1506 - 2233 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0032 --- Epoch 740 / 1506 - 2234 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0027 --- Epoch 741 / 1506 - 2235 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0030 --- Epoch 742 / 1506 - 2236 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0077 --- Epoch 743 / 1506 - 2237 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0046 --- Epoch 744 / 1506 - 2238 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0045 --- Epoch 745 / 1506 - 2239 epochs total Iteration 0, 
loss = 0.0030 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0025 --- Epoch 746 / 1506 - 2240 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0025 --- Epoch 747 / 1506 - 2241 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0023 --- Epoch 748 / 1506 - 2242 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0035 --- Epoch 749 / 1506 - 2243 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0025 --- Epoch 750 / 1506 - 2244 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0047 --- Epoch 751 / 1506 - 2245 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0095 --- Epoch 752 / 1506 - 2246 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0018 --- Epoch 753 / 1506 - 2247 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0200 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0024 --- Epoch 754 / 1506 - 2248 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0024 --- Epoch 755 / 1506 - 2249 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0034 --- Epoch 756 / 1506 - 2250 epochs total Iteration 0, loss = 0.0036 
Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0154 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0027 --- Epoch 757 / 1506 - 2251 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0075 --- Epoch 758 / 1506 - 2252 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0040 --- Epoch 759 / 1506 - 2253 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0076 --- Epoch 760 / 1506 - 2254 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0039 --- Epoch 761 / 1506 - 2255 epochs total Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0015 --- Epoch 762 / 1506 - 2256 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0053 --- Epoch 763 / 1506 - 2257 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0179 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0028 --- Epoch 764 / 1506 - 2258 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0040 --- Epoch 765 / 1506 - 2259 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0046 --- Epoch 766 / 1506 - 2260 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0056 --- Epoch 767 / 1506 - 2261 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss 
= 0.0026 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0024 --- Epoch 768 / 1506 - 2262 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0054 --- Epoch 769 / 1506 - 2263 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0027 --- Epoch 770 / 1506 - 2264 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0035 --- Epoch 771 / 1506 - 2265 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0021 --- Epoch 772 / 1506 - 2266 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0039 --- Epoch 773 / 1506 - 2267 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0221 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0035 --- Epoch 774 / 1506 - 2268 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0035 --- Epoch 775 / 1506 - 2269 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0051 --- Epoch 776 / 1506 - 2270 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0088 --- Epoch 777 / 1506 - 2271 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0159 --- Epoch 778 / 1506 - 2272 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0035 Iteration 
40, loss = 0.0074 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0057 --- Epoch 779 / 1506 - 2273 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0048 --- Epoch 780 / 1506 - 2274 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0032 --- Epoch 781 / 1506 - 2275 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0254 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0223 --- Epoch 782 / 1506 - 2276 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0072 --- Epoch 783 / 1506 - 2277 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0018 --- Epoch 784 / 1506 - 2278 epochs total Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0037 --- Epoch 785 / 1506 - 2279 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0037 --- Epoch 786 / 1506 - 2280 epochs total Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0043 --- Epoch 787 / 1506 - 2281 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0097 --- Epoch 788 / 1506 - 2282 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0035 --- Epoch 789 / 1506 - 2283 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0086 
Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0053 --- Epoch 790 / 1506 - 2284 epochs total Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0172 --- Epoch 791 / 1506 - 2285 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0057 --- Epoch 792 / 1506 - 2286 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0028 --- Epoch 793 / 1506 - 2287 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0054 --- Epoch 794 / 1506 - 2288 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0049 --- Epoch 795 / 1506 - 2289 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0031 --- Epoch 796 / 1506 - 2290 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0047 --- Epoch 797 / 1506 - 2291 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0059 --- Epoch 798 / 1506 - 2292 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0013 --- Epoch 799 / 1506 - 2293 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0044 --- Epoch 800 / 1506 - 2294 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0024 Iteration 60, loss 
= 0.0023 Iteration 80, loss = 0.0039 --- Epoch 801 / 1506 - 2295 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0061 --- Epoch 802 / 1506 - 2296 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0039 --- Epoch 803 / 1506 - 2297 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0034 --- Epoch 804 / 1506 - 2298 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0029 --- Epoch 805 / 1506 - 2299 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0021 --- Epoch 806 / 1506 - 2300 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0021 --- Epoch 807 / 1506 - 2301 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0030 --- Epoch 808 / 1506 - 2302 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0035 --- Epoch 809 / 1506 - 2303 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0023 --- Epoch 810 / 1506 - 2304 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0032 --- Epoch 811 / 1506 - 2305 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0038 Iteration 
80, loss = 0.0032 --- Epoch 812 / 1506 - 2306 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0045 --- Epoch 813 / 1506 - 2307 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0053 --- Epoch 814 / 1506 - 2308 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0023 --- Epoch 815 / 1506 - 2309 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0052 --- Epoch 816 / 1506 - 2310 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0075 --- Epoch 817 / 1506 - 2311 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0053 --- Epoch 818 / 1506 - 2312 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0028 --- Epoch 819 / 1506 - 2313 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0072 --- Epoch 820 / 1506 - 2314 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0043 --- Epoch 821 / 1506 - 2315 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0119 --- Epoch 822 / 1506 - 2316 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0067 
--- Epoch 823 / 1506 - 2317 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0189 --- Epoch 824 / 1506 - 2318 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0025 --- Epoch 825 / 1506 - 2319 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0041 --- Epoch 826 / 1506 - 2320 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0026 --- Epoch 827 / 1506 - 2321 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0086 --- Epoch 828 / 1506 - 2322 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0082 --- Epoch 829 / 1506 - 2323 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0028 --- Epoch 830 / 1506 - 2324 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0226 Iteration 80, loss = 0.0020 --- Epoch 831 / 1506 - 2325 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0030 --- Epoch 832 / 1506 - 2326 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0059 --- Epoch 833 / 1506 - 2327 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0116 --- Epoch 834 / 
1506 - 2328 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0222 --- Epoch 835 / 1506 - 2329 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0019 --- Epoch 836 / 1506 - 2330 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0128 --- Epoch 837 / 1506 - 2331 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0037 --- Epoch 838 / 1506 - 2332 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0038 --- Epoch 839 / 1506 - 2333 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0023 --- Epoch 840 / 1506 - 2334 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0082 --- Epoch 841 / 1506 - 2335 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0043 --- Epoch 842 / 1506 - 2336 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0054 --- Epoch 843 / 1506 - 2337 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0030 --- Epoch 844 / 1506 - 2338 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0191 Iteration 80, loss = 0.0067 --- Epoch 845 / 1506 - 2339 epochs 
total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0040 --- Epoch 846 / 1506 - 2340 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0036 --- Epoch 847 / 1506 - 2341 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0042 --- Epoch 848 / 1506 - 2342 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0045 --- Epoch 849 / 1506 - 2343 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0035 --- Epoch 850 / 1506 - 2344 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0065 --- Epoch 851 / 1506 - 2345 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0035 --- Epoch 852 / 1506 - 2346 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0046 --- Epoch 853 / 1506 - 2347 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0180 --- Epoch 854 / 1506 - 2348 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0030 --- Epoch 855 / 1506 - 2349 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0026 --- Epoch 856 / 1506 - 2350 epochs total Iteration 0, 
loss = 0.0120 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0104 --- Epoch 857 / 1506 - 2351 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0053 --- Epoch 858 / 1506 - 2352 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0126 --- Epoch 859 / 1506 - 2353 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0056 --- Epoch 860 / 1506 - 2354 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0057 --- Epoch 861 / 1506 - 2355 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0027 --- Epoch 862 / 1506 - 2356 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0253 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0052 --- Epoch 863 / 1506 - 2357 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0281 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0073 --- Epoch 864 / 1506 - 2358 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0032 --- Epoch 865 / 1506 - 2359 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0052 --- Epoch 866 / 1506 - 2360 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0048 --- Epoch 867 / 1506 - 2361 epochs total Iteration 0, loss = 0.0040 
Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0034 --- Epoch 868 / 1506 - 2362 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0036 --- Epoch 869 / 1506 - 2363 epochs total Iteration 0, loss = 0.0214 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0079 --- Epoch 870 / 1506 - 2364 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0041 --- Epoch 871 / 1506 - 2365 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0017 --- Epoch 872 / 1506 - 2366 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0054 --- Epoch 873 / 1506 - 2367 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0027 --- Epoch 874 / 1506 - 2368 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0033 --- Epoch 875 / 1506 - 2369 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0049 --- Epoch 876 / 1506 - 2370 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0037 --- Epoch 877 / 1506 - 2371 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0027 --- Epoch 878 / 1506 - 2372 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss 
= 0.0041 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0047 --- Epoch 879 / 1506 - 2373 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0038 --- Epoch 880 / 1506 - 2374 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0024 --- Epoch 881 / 1506 - 2375 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0098 --- Epoch 882 / 1506 - 2376 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0027 --- Epoch 883 / 1506 - 2377 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0053 --- Epoch 884 / 1506 - 2378 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0026 --- Epoch 885 / 1506 - 2379 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0031 --- Epoch 886 / 1506 - 2380 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0029 --- Epoch 887 / 1506 - 2381 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0138 --- Epoch 888 / 1506 - 2382 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0031 --- Epoch 889 / 1506 - 2383 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0019 Iteration 
40, loss = 0.0018 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0025 --- Epoch 890 / 1506 - 2384 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0062 --- Epoch 891 / 1506 - 2385 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0109 --- Epoch 892 / 1506 - 2386 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0023 --- Epoch 893 / 1506 - 2387 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0044 --- Epoch 894 / 1506 - 2388 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0033 --- Epoch 895 / 1506 - 2389 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0059 --- Epoch 896 / 1506 - 2390 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0041 --- Epoch 897 / 1506 - 2391 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0046 --- Epoch 898 / 1506 - 2392 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0046 --- Epoch 899 / 1506 - 2393 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0043 --- Epoch 900 / 1506 - 2394 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0116 
Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0025 --- Epoch 901 / 1506 - 2395 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0029 --- Epoch 902 / 1506 - 2396 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0024 --- Epoch 903 / 1506 - 2397 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0025 --- Epoch 904 / 1506 - 2398 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0034 --- Epoch 905 / 1506 - 2399 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0027 --- Epoch 906 / 1506 - 2400 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0018 --- Epoch 907 / 1506 - 2401 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0031 --- Epoch 908 / 1506 - 2402 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0026 --- Epoch 909 / 1506 - 2403 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0055 --- Epoch 910 / 1506 - 2404 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0043 --- Epoch 911 / 1506 - 2405 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0045 Iteration 60, loss 
= 0.0038 Iteration 80, loss = 0.0030 --- Epoch 912 / 1506 - 2406 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0060 --- Epoch 913 / 1506 - 2407 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0031 --- Epoch 914 / 1506 - 2408 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0025 --- Epoch 915 / 1506 - 2409 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0052 --- Epoch 916 / 1506 - 2410 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0018 --- Epoch 917 / 1506 - 2411 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0019 --- Epoch 918 / 1506 - 2412 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0040 --- Epoch 919 / 1506 - 2413 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0185 --- Epoch 920 / 1506 - 2414 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0060 --- Epoch 921 / 1506 - 2415 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0029 --- Epoch 922 / 1506 - 2416 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0066 Iteration 
80, loss = 0.0025 --- Epoch 923 / 1506 - 2417 epochs total Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0031 --- Epoch 924 / 1506 - 2418 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0052 --- Epoch 925 / 1506 - 2419 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0030 --- Epoch 926 / 1506 - 2420 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0035 --- Epoch 927 / 1506 - 2421 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0038 --- Epoch 928 / 1506 - 2422 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0032 --- Epoch 929 / 1506 - 2423 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0025 --- Epoch 930 / 1506 - 2424 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0077 --- Epoch 931 / 1506 - 2425 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0043 --- Epoch 932 / 1506 - 2426 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0047 --- Epoch 933 / 1506 - 2427 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0017 
--- Epoch 934 / 1506 - 2428 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0027 --- Epoch 935 / 1506 - 2429 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0077 --- Epoch 936 / 1506 - 2430 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0088 --- Epoch 937 / 1506 - 2431 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0053 --- Epoch 938 / 1506 - 2432 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0027 --- Epoch 939 / 1506 - 2433 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0078 --- Epoch 940 / 1506 - 2434 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0055 --- Epoch 941 / 1506 - 2435 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0040 --- Epoch 942 / 1506 - 2436 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0036 --- Epoch 943 / 1506 - 2437 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0032 --- Epoch 944 / 1506 - 2438 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0122 --- Epoch 945 / 
1506 - 2439 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0024 --- Epoch 946 / 1506 - 2440 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0022 --- Epoch 947 / 1506 - 2441 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0031 --- Epoch 948 / 1506 - 2442 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0075 --- Epoch 949 / 1506 - 2443 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0113 --- Epoch 950 / 1506 - 2444 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0032 --- Epoch 951 / 1506 - 2445 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0024 --- Epoch 952 / 1506 - 2446 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0057 --- Epoch 953 / 1506 - 2447 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0030 --- Epoch 954 / 1506 - 2448 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0034 --- Epoch 955 / 1506 - 2449 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0069 --- Epoch 956 / 1506 - 2450 epochs 
total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0041 --- Epoch 957 / 1506 - 2451 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0091 --- Epoch 958 / 1506 - 2452 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0035 --- Epoch 959 / 1506 - 2453 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0039 --- Epoch 960 / 1506 - 2454 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0042 --- Epoch 961 / 1506 - 2455 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0032 --- Epoch 962 / 1506 - 2456 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0280 --- Epoch 963 / 1506 - 2457 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0035 --- Epoch 964 / 1506 - 2458 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0031 --- Epoch 965 / 1506 - 2459 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0032 --- Epoch 966 / 1506 - 2460 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0064 --- Epoch 967 / 1506 - 2461 epochs total Iteration 0, 
loss = 0.0036 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0041 --- Epoch 968 / 1506 - 2462 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0055 --- Epoch 969 / 1506 - 2463 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0055 --- Epoch 970 / 1506 - 2464 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0045 --- Epoch 971 / 1506 - 2465 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0028 --- Epoch 972 / 1506 - 2466 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0042 --- Epoch 973 / 1506 - 2467 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0034 --- Epoch 974 / 1506 - 2468 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0051 --- Epoch 975 / 1506 - 2469 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0070 --- Epoch 976 / 1506 - 2470 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0041 --- Epoch 977 / 1506 - 2471 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0032 --- Epoch 978 / 1506 - 2472 epochs total Iteration 0, loss = 0.0015 
Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0068 --- Epoch 979 / 1506 - 2473 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0047 --- Epoch 980 / 1506 - 2474 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0060 --- Epoch 981 / 1506 - 2475 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0055 --- Epoch 982 / 1506 - 2476 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0045 --- Epoch 983 / 1506 - 2477 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0037 --- Epoch 984 / 1506 - 2478 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0024 --- Epoch 985 / 1506 - 2479 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0012 --- Epoch 986 / 1506 - 2480 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0057 --- Epoch 987 / 1506 - 2481 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0027 --- Epoch 988 / 1506 - 2482 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0024 --- Epoch 989 / 1506 - 2483 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss 
= 0.0082 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0063 --- Epoch 990 / 1506 - 2484 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0040 --- Epoch 991 / 1506 - 2485 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0036 --- Epoch 992 / 1506 - 2486 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0043 --- Epoch 993 / 1506 - 2487 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0063 --- Epoch 994 / 1506 - 2488 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0074 --- Epoch 995 / 1506 - 2489 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0193 Iteration 80, loss = 0.0030 --- Epoch 996 / 1506 - 2490 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0037 --- Epoch 997 / 1506 - 2491 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0026 --- Epoch 998 / 1506 - 2492 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0111 --- Epoch 999 / 1506 - 2493 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0027 --- Epoch 1000 / 1506 - 2494 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0040 Iteration 
40, loss = 0.0036 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0020 --- Epoch 1001 / 1506 - 2495 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0071 --- Epoch 1002 / 1506 - 2496 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0048 --- Epoch 1003 / 1506 - 2497 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0040 --- Epoch 1004 / 1506 - 2498 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0016 --- Epoch 1005 / 1506 - 2499 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0018 --- Epoch 1006 / 1506 - 2500 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0036 --- Epoch 1007 / 1506 - 2501 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0036 --- Epoch 1008 / 1506 - 2502 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0047 --- Epoch 1009 / 1506 - 2503 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0035 --- Epoch 1010 / 1506 - 2504 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0069 --- Epoch 1011 / 1506 - 2505 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0133 Iteration 40, loss 
= 0.0068 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0117 --- Epoch 1012 / 1506 - 2506 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0020 --- Epoch 1013 / 1506 - 2507 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0050 --- Epoch 1014 / 1506 - 2508 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0020 --- Epoch 1015 / 1506 - 2509 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0042 --- Epoch 1016 / 1506 - 2510 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0028 --- Epoch 1017 / 1506 - 2511 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0058 --- Epoch 1018 / 1506 - 2512 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0036 --- Epoch 1019 / 1506 - 2513 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0048 --- Epoch 1020 / 1506 - 2514 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0089 --- Epoch 1021 / 1506 - 2515 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0023 --- Epoch 1022 / 1506 - 2516 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0027 
Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0044 --- Epoch 1023 / 1506 - 2517 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0038 --- Epoch 1024 / 1506 - 2518 epochs total Iteration 0, loss = 0.0214 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0062 --- Epoch 1025 / 1506 - 2519 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0086 --- Epoch 1026 / 1506 - 2520 epochs total Iteration 0, loss = 0.0213 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0056 --- Epoch 1027 / 1506 - 2521 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0099 --- Epoch 1028 / 1506 - 2522 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0023 --- Epoch 1029 / 1506 - 2523 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0031 --- Epoch 1030 / 1506 - 2524 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0024 --- Epoch 1031 / 1506 - 2525 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0025 --- Epoch 1032 / 1506 - 2526 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0020 --- Epoch 1033 / 1506 - 2527 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0027 
Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0032 --- Epoch 1034 / 1506 - 2528 epochs total Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0064 --- Epoch 1035 / 1506 - 2529 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0089 --- Epoch 1036 / 1506 - 2530 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0056 --- Epoch 1037 / 1506 - 2531 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0054 --- Epoch 1038 / 1506 - 2532 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0060 --- Epoch 1039 / 1506 - 2533 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0037 --- Epoch 1040 / 1506 - 2534 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0032 --- Epoch 1041 / 1506 - 2535 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0044 --- Epoch 1042 / 1506 - 2536 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0040 --- Epoch 1043 / 1506 - 2537 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0042 --- Epoch 1044 / 1506 - 2538 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0034 
Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0022 --- Epoch 1045 / 1506 - 2539 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0051 --- Epoch 1046 / 1506 - 2540 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0020 --- Epoch 1047 / 1506 - 2541 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0040 --- Epoch 1048 / 1506 - 2542 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0020 --- Epoch 1049 / 1506 - 2543 epochs total Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0074 --- Epoch 1050 / 1506 - 2544 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0058 --- Epoch 1051 / 1506 - 2545 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0062 --- Epoch 1052 / 1506 - 2546 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0084 --- Epoch 1053 / 1506 - 2547 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0061 --- Epoch 1054 / 1506 - 2548 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0056 --- Epoch 1055 / 1506 - 2549 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0044 
Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0060 --- Epoch 1056 / 1506 - 2550 epochs total Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0040 --- Epoch 1057 / 1506 - 2551 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0033 --- Epoch 1058 / 1506 - 2552 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0019 --- Epoch 1059 / 1506 - 2553 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0070 --- Epoch 1060 / 1506 - 2554 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0061 --- Epoch 1061 / 1506 - 2555 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0018 --- Epoch 1062 / 1506 - 2556 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0044 --- Epoch 1063 / 1506 - 2557 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0138 --- Epoch 1064 / 1506 - 2558 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0029 --- Epoch 1065 / 1506 - 2559 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0046 --- Epoch 1066 / 1506 - 2560 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0091 
Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0030 --- Epoch 1067 / 1506 - 2561 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0029 --- Epoch 1068 / 1506 - 2562 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0059 --- Epoch 1069 / 1506 - 2563 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0029 --- Epoch 1070 / 1506 - 2564 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0060 --- Epoch 1071 / 1506 - 2565 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0045 --- Epoch 1072 / 1506 - 2566 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0034 --- Epoch 1073 / 1506 - 2567 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0037 --- Epoch 1074 / 1506 - 2568 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0032 --- Epoch 1075 / 1506 - 2569 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0035 --- Epoch 1076 / 1506 - 2570 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0068 --- Epoch 1077 / 1506 - 2571 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0021 
Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0056 --- Epoch 1078 / 1506 - 2572 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0031 --- Epoch 1079 / 1506 - 2573 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0014 --- Epoch 1080 / 1506 - 2574 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0056 --- Epoch 1081 / 1506 - 2575 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0222 --- Epoch 1082 / 1506 - 2576 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0062 --- Epoch 1083 / 1506 - 2577 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0068 --- Epoch 1084 / 1506 - 2578 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0050 --- Epoch 1085 / 1506 - 2579 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0034 --- Epoch 1086 / 1506 - 2580 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0047 --- Epoch 1087 / 1506 - 2581 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0058 --- Epoch 1088 / 1506 - 2582 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0014 
Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0025 --- Epoch 1089 / 1506 - 2583 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0034 --- Epoch 1090 / 1506 - 2584 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0046 --- Epoch 1091 / 1506 - 2585 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0033 --- Epoch 1092 / 1506 - 2586 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0026 --- Epoch 1093 / 1506 - 2587 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0038 --- Epoch 1094 / 1506 - 2588 epochs total Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0027 --- Epoch 1095 / 1506 - 2589 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0027 --- Epoch 1096 / 1506 - 2590 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0031 --- Epoch 1097 / 1506 - 2591 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0034 --- Epoch 1098 / 1506 - 2592 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0067 --- Epoch 1099 / 1506 - 2593 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0051 
Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0025 --- Epoch 1100 / 1506 - 2594 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0030 --- Epoch 1101 / 1506 - 2595 epochs total Iteration 0, loss = 0.0254 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0033 --- Epoch 1102 / 1506 - 2596 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0049 --- Epoch 1103 / 1506 - 2597 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0028 --- Epoch 1104 / 1506 - 2598 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0051 --- Epoch 1105 / 1506 - 2599 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0037 --- Epoch 1106 / 1506 - 2600 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0043 --- Epoch 1107 / 1506 - 2601 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0030 --- Epoch 1108 / 1506 - 2602 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0049 --- Epoch 1109 / 1506 - 2603 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0025 --- Epoch 1110 / 1506 - 2604 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0018 
Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0079 --- Epoch 1111 / 1506 - 2605 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0031 --- Epoch 1112 / 1506 - 2606 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0047 --- Epoch 1113 / 1506 - 2607 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0024 --- Epoch 1114 / 1506 - 2608 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0057 --- Epoch 1115 / 1506 - 2609 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0088 --- Epoch 1116 / 1506 - 2610 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0027 --- Epoch 1117 / 1506 - 2611 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0054 --- Epoch 1118 / 1506 - 2612 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0024 --- Epoch 1119 / 1506 - 2613 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0029 --- Epoch 1120 / 1506 - 2614 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0020 --- Epoch 1121 / 1506 - 2615 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0045 
Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0067 --- Epoch 1122 / 1506 - 2616 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0057 --- Epoch 1123 / 1506 - 2617 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0025 --- Epoch 1124 / 1506 - 2618 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0019 --- Epoch 1125 / 1506 - 2619 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0253 --- Epoch 1126 / 1506 - 2620 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0077 --- Epoch 1127 / 1506 - 2621 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0046 --- Epoch 1128 / 1506 - 2622 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0028 --- Epoch 1129 / 1506 - 2623 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0022 --- Epoch 1130 / 1506 - 2624 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0029 --- Epoch 1131 / 1506 - 2625 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0114 --- Epoch 1132 / 1506 - 2626 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0070 
Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0016 --- Epoch 1133 / 1506 - 2627 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0024 --- Epoch 1134 / 1506 - 2628 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0089 --- Epoch 1135 / 1506 - 2629 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0065 --- Epoch 1136 / 1506 - 2630 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0037 --- Epoch 1137 / 1506 - 2631 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0033 --- Epoch 1138 / 1506 - 2632 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0019 --- Epoch 1139 / 1506 - 2633 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0018 --- Epoch 1140 / 1506 - 2634 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0035 --- Epoch 1141 / 1506 - 2635 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0037 --- Epoch 1142 / 1506 - 2636 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0023 --- Epoch 1143 / 1506 - 2637 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0036 
Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0065 --- Epoch 1144 / 1506 - 2638 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0039 --- Epoch 1145 / 1506 - 2639 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0023 --- Epoch 1146 / 1506 - 2640 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0075 --- Epoch 1147 / 1506 - 2641 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0070 --- Epoch 1148 / 1506 - 2642 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0031 --- Epoch 1149 / 1506 - 2643 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0046 --- Epoch 1150 / 1506 - 2644 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0054 --- Epoch 1151 / 1506 - 2645 epochs total Iteration 0, loss = 0.0176 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0030 --- Epoch 1152 / 1506 - 2646 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0083 --- Epoch 1153 / 1506 - 2647 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0054 --- Epoch 1154 / 1506 - 2648 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0043 
Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0039 --- Epoch 1155 / 1506 - 2649 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0040 --- Epoch 1156 / 1506 - 2650 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0038 --- Epoch 1157 / 1506 - 2651 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0084 --- Epoch 1158 / 1506 - 2652 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0024 --- Epoch 1159 / 1506 - 2653 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0042 --- Epoch 1160 / 1506 - 2654 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0027 --- Epoch 1161 / 1506 - 2655 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0030 --- Epoch 1162 / 1506 - 2656 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0060 --- Epoch 1163 / 1506 - 2657 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0053 --- Epoch 1164 / 1506 - 2658 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0287 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0042 --- Epoch 1165 / 1506 - 2659 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0055 
Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0024 --- Epoch 1166 / 1506 - 2660 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0022 --- Epoch 1167 / 1506 - 2661 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0024 --- Epoch 1168 / 1506 - 2662 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0044 --- Epoch 1169 / 1506 - 2663 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0029 --- Epoch 1170 / 1506 - 2664 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0054 --- Epoch 1171 / 1506 - 2665 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0027 --- Epoch 1172 / 1506 - 2666 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0032 --- Epoch 1173 / 1506 - 2667 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0055 --- Epoch 1174 / 1506 - 2668 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0049 --- Epoch 1175 / 1506 - 2669 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0042 --- Epoch 1176 / 1506 - 2670 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0030 
Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0066 --- Epoch 1177 / 1506 - 2671 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0050 --- Epoch 1178 / 1506 - 2672 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0033 --- Epoch 1179 / 1506 - 2673 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0061 --- Epoch 1180 / 1506 - 2674 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0052 --- Epoch 1181 / 1506 - 2675 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0192 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0023 --- Epoch 1182 / 1506 - 2676 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0035 --- Epoch 1183 / 1506 - 2677 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0045 --- Epoch 1184 / 1506 - 2678 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0079 --- Epoch 1185 / 1506 - 2679 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0050 --- Epoch 1186 / 1506 - 2680 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0026 --- Epoch 1187 / 1506 - 2681 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0038 
Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0026 --- Epoch 1188 / 1506 - 2682 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0024 --- Epoch 1189 / 1506 - 2683 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0032 --- Epoch 1190 / 1506 - 2684 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0077 --- Epoch 1191 / 1506 - 2685 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0049 --- Epoch 1192 / 1506 - 2686 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0016 --- Epoch 1193 / 1506 - 2687 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0029 --- Epoch 1194 / 1506 - 2688 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0041 --- Epoch 1195 / 1506 - 2689 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0029 --- Epoch 1196 / 1506 - 2690 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0043 --- Epoch 1197 / 1506 - 2691 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0054 --- Epoch 1198 / 1506 - 2692 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0027 
Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0069 --- Epoch 1199 / 1506 - 2693 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0035 --- Epoch 1200 / 1506 - 2694 epochs total Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0140 --- Epoch 1201 / 1506 - 2695 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0036 --- Epoch 1202 / 1506 - 2696 epochs total Iteration 0, loss = 0.0512 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0091 --- Epoch 1203 / 1506 - 2697 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0029 --- Epoch 1204 / 1506 - 2698 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0045 --- Epoch 1205 / 1506 - 2699 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0031 --- Epoch 1206 / 1506 - 2700 epochs total Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0059 --- Epoch 1207 / 1506 - 2701 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0534 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0028 --- Epoch 1208 / 1506 - 2702 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0029 --- Epoch 1209 / 1506 - 2703 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0020 
Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0042 --- Epoch 1210 / 1506 - 2704 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0416 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0026 --- Epoch 1211 / 1506 - 2705 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0025 --- Epoch 1212 / 1506 - 2706 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0045 --- Epoch 1213 / 1506 - 2707 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0056 --- Epoch 1214 / 1506 - 2708 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0035 --- Epoch 1215 / 1506 - 2709 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0022 --- Epoch 1216 / 1506 - 2710 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0059 --- Epoch 1217 / 1506 - 2711 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0022 --- Epoch 1218 / 1506 - 2712 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0024 --- Epoch 1219 / 1506 - 2713 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0287 Iteration 80, loss = 0.0038 --- Epoch 1220 / 1506 - 2714 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0028 
Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0041 --- Epoch 1221 / 1506 - 2715 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0040 --- Epoch 1222 / 1506 - 2716 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0034 --- Epoch 1223 / 1506 - 2717 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0053 --- Epoch 1224 / 1506 - 2718 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0041 --- Epoch 1225 / 1506 - 2719 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0040 --- Epoch 1226 / 1506 - 2720 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0050 --- Epoch 1227 / 1506 - 2721 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0067 --- Epoch 1228 / 1506 - 2722 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0043 --- Epoch 1229 / 1506 - 2723 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0029 --- Epoch 1230 / 1506 - 2724 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0038 --- Epoch 1231 / 1506 - 2725 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0035 
Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0059 --- Epoch 1232 / 1506 - 2726 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0021 --- Epoch 1233 / 1506 - 2727 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0059 --- Epoch 1234 / 1506 - 2728 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0080 --- Epoch 1235 / 1506 - 2729 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0058 --- Epoch 1236 / 1506 - 2730 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0042 --- Epoch 1237 / 1506 - 2731 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0080 --- Epoch 1238 / 1506 - 2732 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0410 Iteration 40, loss = 0.0230 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0015 --- Epoch 1239 / 1506 - 2733 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0070 --- Epoch 1240 / 1506 - 2734 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0039 --- Epoch 1241 / 1506 - 2735 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0038 --- Epoch 1242 / 1506 - 2736 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0100 
Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0029 --- Epoch 1243 / 1506 - 2737 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0070 --- Epoch 1244 / 1506 - 2738 epochs total Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0050 --- Epoch 1245 / 1506 - 2739 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0063 --- Epoch 1246 / 1506 - 2740 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0040 --- Epoch 1247 / 1506 - 2741 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0056 --- Epoch 1248 / 1506 - 2742 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0056 --- Epoch 1249 / 1506 - 2743 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0047 --- Epoch 1250 / 1506 - 2744 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0035 --- Epoch 1251 / 1506 - 2745 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0025 --- Epoch 1252 / 1506 - 2746 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0067 --- Epoch 1253 / 1506 - 2747 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0067 
Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0035 --- Epoch 1254 / 1506 - 2748 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0084 --- Epoch 1255 / 1506 - 2749 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0073 --- Epoch 1256 / 1506 - 2750 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0042 --- Epoch 1257 / 1506 - 2751 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0020 --- Epoch 1258 / 1506 - 2752 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0019 --- Epoch 1259 / 1506 - 2753 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0069 --- Epoch 1260 / 1506 - 2754 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0214 Iteration 80, loss = 0.0030 --- Epoch 1261 / 1506 - 2755 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0129 --- Epoch 1262 / 1506 - 2756 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0025 --- Epoch 1263 / 1506 - 2757 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0051 --- Epoch 1264 / 1506 - 2758 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0024 
Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0036 --- Epoch 1265 / 1506 - 2759 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0039 --- Epoch 1266 / 1506 - 2760 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0119 --- Epoch 1267 / 1506 - 2761 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0024 --- Epoch 1268 / 1506 - 2762 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0041 --- Epoch 1269 / 1506 - 2763 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0035 --- Epoch 1270 / 1506 - 2764 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0054 --- Epoch 1271 / 1506 - 2765 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0105 --- Epoch 1272 / 1506 - 2766 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0022 --- Epoch 1273 / 1506 - 2767 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0043 --- Epoch 1274 / 1506 - 2768 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0718 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0026 --- Epoch 1275 / 1506 - 2769 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0053 
Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0028 --- Epoch 1276 / 1506 - 2770 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0035 --- Epoch 1277 / 1506 - 2771 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0024 --- Epoch 1278 / 1506 - 2772 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0058 --- Epoch 1279 / 1506 - 2773 epochs total Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0060 --- Epoch 1280 / 1506 - 2774 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0111 --- Epoch 1281 / 1506 - 2775 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0027 --- Epoch 1282 / 1506 - 2776 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0021 --- Epoch 1283 / 1506 - 2777 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0044 --- Epoch 1284 / 1506 - 2778 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0039 --- Epoch 1285 / 1506 - 2779 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0031 --- Epoch 1286 / 1506 - 2780 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0057 
Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0057 --- Epoch 1287 / 1506 - 2781 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0026 --- Epoch 1288 / 1506 - 2782 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0035 --- Epoch 1289 / 1506 - 2783 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0106 --- Epoch 1290 / 1506 - 2784 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0061 --- Epoch 1291 / 1506 - 2785 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0028 --- Epoch 1292 / 1506 - 2786 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0028 --- Epoch 1293 / 1506 - 2787 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0029 --- Epoch 1294 / 1506 - 2788 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0033 --- Epoch 1295 / 1506 - 2789 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0031 --- Epoch 1296 / 1506 - 2790 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0087 --- Epoch 1297 / 1506 - 2791 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0034 
Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0035 --- Epoch 1298 / 1506 - 2792 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0019 --- Epoch 1299 / 1506 - 2793 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0043 --- Epoch 1300 / 1506 - 2794 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0039 --- Epoch 1301 / 1506 - 2795 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0030 --- Epoch 1302 / 1506 - 2796 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0034 --- Epoch 1303 / 1506 - 2797 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0222 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0063 --- Epoch 1304 / 1506 - 2798 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0073 --- Epoch 1305 / 1506 - 2799 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0025 --- Epoch 1306 / 1506 - 2800 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0151 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0053 --- Epoch 1307 / 1506 - 2801 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0056 --- Epoch 1308 / 1506 - 2802 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0056 
Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0031 --- Epoch 1309 / 1506 - 2803 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0050 --- Epoch 1310 / 1506 - 2804 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0018 --- Epoch 1311 / 1506 - 2805 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0035 --- Epoch 1312 / 1506 - 2806 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0059 --- Epoch 1313 / 1506 - 2807 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0017 --- Epoch 1314 / 1506 - 2808 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0011 --- Epoch 1315 / 1506 - 2809 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0037 --- Epoch 1316 / 1506 - 2810 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0028 --- Epoch 1317 / 1506 - 2811 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0037 --- Epoch 1318 / 1506 - 2812 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0025 --- Epoch 1319 / 1506 - 2813 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0028 
Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0026 --- Epoch 1320 / 1506 - 2814 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0074 --- Epoch 1321 / 1506 - 2815 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0027 --- Epoch 1322 / 1506 - 2816 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0058 --- Epoch 1323 / 1506 - 2817 epochs total Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0027 --- Epoch 1324 / 1506 - 2818 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0041 --- Epoch 1325 / 1506 - 2819 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0065 --- Epoch 1326 / 1506 - 2820 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0039 --- Epoch 1327 / 1506 - 2821 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0044 --- Epoch 1328 / 1506 - 2822 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0022 --- Epoch 1329 / 1506 - 2823 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0065 --- Epoch 1330 / 1506 - 2824 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0041 
Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0086 --- Epoch 1331 / 1506 - 2825 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0138 --- Epoch 1332 / 1506 - 2826 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0033 --- Epoch 1333 / 1506 - 2827 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0042 --- Epoch 1334 / 1506 - 2828 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0089 --- Epoch 1335 / 1506 - 2829 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0226 --- Epoch 1336 / 1506 - 2830 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0060 --- Epoch 1337 / 1506 - 2831 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0035 --- Epoch 1338 / 1506 - 2832 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0035 --- Epoch 1339 / 1506 - 2833 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0017 --- Epoch 1340 / 1506 - 2834 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0045 --- Epoch 1341 / 1506 - 2835 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0037 
Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0095 --- Epoch 1342 / 1506 - 2836 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0022 --- Epoch 1343 / 1506 - 2837 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0042 --- Epoch 1344 / 1506 - 2838 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0076 --- Epoch 1345 / 1506 - 2839 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0036 --- Epoch 1346 / 1506 - 2840 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0032 --- Epoch 1347 / 1506 - 2841 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0039 --- Epoch 1348 / 1506 - 2842 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0017 --- Epoch 1349 / 1506 - 2843 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0023 --- Epoch 1350 / 1506 - 2844 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0021 --- Epoch 1351 / 1506 - 2845 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0034 --- Epoch 1352 / 1506 - 2846 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0030 
Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0038 --- Epoch 1353 / 1506 - 2847 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0063 --- Epoch 1354 / 1506 - 2848 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0036 --- Epoch 1355 / 1506 - 2849 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0046 --- Epoch 1356 / 1506 - 2850 epochs total Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0048 --- Epoch 1357 / 1506 - 2851 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0082 --- Epoch 1358 / 1506 - 2852 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0065 --- Epoch 1359 / 1506 - 2853 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0023 --- Epoch 1360 / 1506 - 2854 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0020 --- Epoch 1361 / 1506 - 2855 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0053 --- Epoch 1362 / 1506 - 2856 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0028 --- Epoch 1363 / 1506 - 2857 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0041 
Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0042 --- Epoch 1364 / 1506 - 2858 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0064 --- Epoch 1365 / 1506 - 2859 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0052 --- Epoch 1366 / 1506 - 2860 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0043 --- Epoch 1367 / 1506 - 2861 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0047 --- Epoch 1368 / 1506 - 2862 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0036 --- Epoch 1369 / 1506 - 2863 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0018 --- Epoch 1370 / 1506 - 2864 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0136 --- Epoch 1371 / 1506 - 2865 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0043 --- Epoch 1372 / 1506 - 2866 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0022 --- Epoch 1373 / 1506 - 2867 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0038 --- Epoch 1374 / 1506 - 2868 epochs total Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0161 Iteration 40, loss = 0.0051 
Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0032 --- Epoch 1375 / 1506 - 2869 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0027 --- Epoch 1376 / 1506 - 2870 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0030 --- Epoch 1377 / 1506 - 2871 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0039 --- Epoch 1378 / 1506 - 2872 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0034 --- Epoch 1379 / 1506 - 2873 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0397 --- Epoch 1380 / 1506 - 2874 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0044 --- Epoch 1381 / 1506 - 2875 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0035 --- Epoch 1382 / 1506 - 2876 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0223 --- Epoch 1383 / 1506 - 2877 epochs total Iteration 0, loss = 0.0332 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0072 --- Epoch 1384 / 1506 - 2878 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0029 --- Epoch 1385 / 1506 - 2879 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0038 
Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0037 --- Epoch 1386 / 1506 - 2880 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0054 --- Epoch 1387 / 1506 - 2881 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0040 --- Epoch 1388 / 1506 - 2882 epochs total Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0068 --- Epoch 1389 / 1506 - 2883 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0036 --- Epoch 1390 / 1506 - 2884 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0170 --- Epoch 1391 / 1506 - 2885 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0022 --- Epoch 1392 / 1506 - 2886 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0041 --- Epoch 1393 / 1506 - 2887 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0022 --- Epoch 1394 / 1506 - 2888 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0033 --- Epoch 1395 / 1506 - 2889 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0040 --- Epoch 1396 / 1506 - 2890 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0029 
Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0097 --- Epoch 1397 / 1506 - 2891 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0022 --- Epoch 1398 / 1506 - 2892 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0039 --- Epoch 1399 / 1506 - 2893 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0055 --- Epoch 1400 / 1506 - 2894 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0037 --- Epoch 1401 / 1506 - 2895 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0042 --- Epoch 1402 / 1506 - 2896 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0147 --- Epoch 1403 / 1506 - 2897 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0042 --- Epoch 1404 / 1506 - 2898 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0028 --- Epoch 1405 / 1506 - 2899 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0026 --- Epoch 1406 / 1506 - 2900 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0125 --- Epoch 1407 / 1506 - 2901 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0047 
Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0193 --- Epoch 1408 / 1506 - 2902 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0054 --- Epoch 1409 / 1506 - 2903 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0035 --- Epoch 1410 / 1506 - 2904 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0031 --- Epoch 1411 / 1506 - 2905 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0043 --- Epoch 1412 / 1506 - 2906 epochs total Iteration 0, loss = 0.0407 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0036 --- Epoch 1413 / 1506 - 2907 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0047 --- Epoch 1414 / 1506 - 2908 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0028 --- Epoch 1415 / 1506 - 2909 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0031 --- Epoch 1416 / 1506 - 2910 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0292 Iteration 80, loss = 0.0050 --- Epoch 1417 / 1506 - 2911 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0049 --- Epoch 1418 / 1506 - 2912 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0063 
Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0055 --- Epoch 1419 / 1506 - 2913 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0026 --- Epoch 1420 / 1506 - 2914 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0096 --- Epoch 1421 / 1506 - 2915 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0025 --- Epoch 1422 / 1506 - 2916 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0027 --- Epoch 1423 / 1506 - 2917 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0024 --- Epoch 1424 / 1506 - 2918 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0025 --- Epoch 1425 / 1506 - 2919 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0083 --- Epoch 1426 / 1506 - 2920 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0058 --- Epoch 1427 / 1506 - 2921 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0034 --- Epoch 1428 / 1506 - 2922 epochs total Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0052 --- Epoch 1429 / 1506 - 2923 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0014 
Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0088 --- Epoch 1430 / 1506 - 2924 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0044 --- Epoch 1431 / 1506 - 2925 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0053 --- Epoch 1432 / 1506 - 2926 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0022 --- Epoch 1433 / 1506 - 2927 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0013 --- Epoch 1434 / 1506 - 2928 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0039 --- Epoch 1435 / 1506 - 2929 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0059 --- Epoch 1436 / 1506 - 2930 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0153 --- Epoch 1437 / 1506 - 2931 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0048 --- Epoch 1438 / 1506 - 2932 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0017 --- Epoch 1439 / 1506 - 2933 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0022 --- Epoch 1440 / 1506 - 2934 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0058 
Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0023 --- Epoch 1441 / 1506 - 2935 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0036 --- Epoch 1442 / 1506 - 2936 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0026 --- Epoch 1443 / 1506 - 2937 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0026 --- Epoch 1444 / 1506 - 2938 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0059 --- Epoch 1445 / 1506 - 2939 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0032 --- Epoch 1446 / 1506 - 2940 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0067 --- Epoch 1447 / 1506 - 2941 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0050 --- Epoch 1448 / 1506 - 2942 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0033 --- Epoch 1449 / 1506 - 2943 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0098 --- Epoch 1450 / 1506 - 2944 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0022 --- Epoch 1451 / 1506 - 2945 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0059 
Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0017 --- Epoch 1452 / 1506 - 2946 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0029 --- Epoch 1453 / 1506 - 2947 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0097 --- Epoch 1454 / 1506 - 2948 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0027 --- Epoch 1455 / 1506 - 2949 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0030 --- Epoch 1456 / 1506 - 2950 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0020 --- Epoch 1457 / 1506 - 2951 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0046 --- Epoch 1458 / 1506 - 2952 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0018 --- Epoch 1459 / 1506 - 2953 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0070 --- Epoch 1460 / 1506 - 2954 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0023 --- Epoch 1461 / 1506 - 2955 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0281 --- Epoch 1462 / 1506 - 2956 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0060 
Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0088 --- Epoch 1463 / 1506 - 2957 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0048 --- Epoch 1464 / 1506 - 2958 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0025 --- Epoch 1465 / 1506 - 2959 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0031 --- Epoch 1466 / 1506 - 2960 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0028 --- Epoch 1467 / 1506 - 2961 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0025 --- Epoch 1468 / 1506 - 2962 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0087 --- Epoch 1469 / 1506 - 2963 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0036 --- Epoch 1470 / 1506 - 2964 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0064 --- Epoch 1471 / 1506 - 2965 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0030 --- Epoch 1472 / 1506 - 2966 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0070 --- Epoch 1473 / 1506 - 2967 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0092 
Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0023 --- Epoch 1474 / 1506 - 2968 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0035 --- Epoch 1475 / 1506 - 2969 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0026 --- Epoch 1476 / 1506 - 2970 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0280 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0076 --- Epoch 1477 / 1506 - 2971 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0040 --- Epoch 1478 / 1506 - 2972 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0037 --- Epoch 1479 / 1506 - 2973 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0015 --- Epoch 1480 / 1506 - 2974 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0028 --- Epoch 1481 / 1506 - 2975 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0031 --- Epoch 1482 / 1506 - 2976 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0020 --- Epoch 1483 / 1506 - 2977 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0031 --- Epoch 1484 / 1506 - 2978 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0044 
Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0044 --- Epoch 1485 / 1506 - 2979 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0037 --- Epoch 1486 / 1506 - 2980 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0033 --- Epoch 1487 / 1506 - 2981 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0041 --- Epoch 1488 / 1506 - 2982 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0086 --- Epoch 1489 / 1506 - 2983 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0022 --- Epoch 1490 / 1506 - 2984 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0045 --- Epoch 1491 / 1506 - 2985 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0041 --- Epoch 1492 / 1506 - 2986 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0059 --- Epoch 1493 / 1506 - 2987 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0023 --- Epoch 1494 / 1506 - 2988 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0058 --- Epoch 1495 / 1506 - 2989 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0023 
Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0118 --- Epoch 1496 / 1506 - 2990 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0054 --- Epoch 1497 / 1506 - 2991 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0253 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0024 --- Epoch 1498 / 1506 - 2992 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0047 --- Epoch 1499 / 1506 - 2993 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0011 --- Epoch 1500 / 1506 - 2994 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0178 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0043 --- Epoch 1501 / 1506 - 2995 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0021 --- Epoch 1502 / 1506 - 2996 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0534 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0100 --- Epoch 1503 / 1506 - 2997 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0030 --- Epoch 1504 / 1506 - 2998 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0057 --- Epoch 1505 / 1506 - 2999 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0016 --- Epoch 1506 / 1506 - 3000 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0040 
Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0061
# Score model12 on the horse test split using mean-squared-error loss.
testModel(
    model12,
    x_test=data["X_test_horse"],
    y_test=data["y_test_horse"],
    criterion=nn.MSELoss(),
)

# Build a new ConvNet4 and fit it to the truck training split with plain SGD.
learning_rate = 1e-2
model13 = ConvNet4()
optimizer = optim.SGD(model13.parameters(), lr=learning_rate)
train(
    model13,
    optimizer,
    epochs=1369,
    x_train=data["X_train_truck"],
    y_train=data["y_train_truck"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 1369 - 1634 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0030 --- Epoch 2 / 1369 - 1635 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0008 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0036 --- Epoch 3 / 1369 - 1636 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0037 --- Epoch 4 / 1369 - 1637 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0020 --- Epoch 5 / 1369 - 1638 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0046 --- Epoch 6 / 1369 - 1639 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0054 --- Epoch 7 / 1369 - 1640 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0093 --- Epoch 8 / 1369 - 1641 epochs total Iteration 0, loss = 0.0006 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0132 --- Epoch 9 / 1369 - 1642 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0015 --- Epoch 10 / 1369 - 1643 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0185 --- Epoch 11 / 1369 - 1644 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0252 Iteration 80, loss = 0.0018 --- Epoch 12 / 1369 - 1645 epochs total 
Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0027 --- Epoch 13 / 1369 - 1646 epochs total Iteration 0, loss = 0.0227 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0014 --- Epoch 14 / 1369 - 1647 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0013 --- Epoch 15 / 1369 - 1648 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0031 --- Epoch 16 / 1369 - 1649 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0122 --- Epoch 17 / 1369 - 1650 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0199 --- Epoch 18 / 1369 - 1651 epochs total Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0014 --- Epoch 19 / 1369 - 1652 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0012 --- Epoch 20 / 1369 - 1653 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0286 --- Epoch 21 / 1369 - 1654 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0021 --- Epoch 22 / 1369 - 1655 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0036 --- Epoch 23 / 1369 - 1656 epochs total Iteration 0, loss = 0.0043 
Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0042 --- Epoch 24 / 1369 - 1657 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0015 --- Epoch 25 / 1369 - 1658 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0123 --- Epoch 26 / 1369 - 1659 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0164 --- Epoch 27 / 1369 - 1660 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0026 --- Epoch 28 / 1369 - 1661 epochs total Iteration 0, loss = 0.0172 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0043 --- Epoch 29 / 1369 - 1662 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0005 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0051 --- Epoch 30 / 1369 - 1663 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0122 --- Epoch 31 / 1369 - 1664 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0029 --- Epoch 32 / 1369 - 1665 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0019 --- Epoch 33 / 1369 - 1666 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0171 --- Epoch 34 / 1369 - 1667 epochs total Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0049 
Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0054 --- Epoch 35 / 1369 - 1668 epochs total Iteration 0, loss = 0.0008 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0047 --- Epoch 36 / 1369 - 1669 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0043 --- Epoch 37 / 1369 - 1670 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0033 --- Epoch 38 / 1369 - 1671 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0061 --- Epoch 39 / 1369 - 1672 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0088 --- Epoch 40 / 1369 - 1673 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0279 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0128 --- Epoch 41 / 1369 - 1674 epochs total Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0015 --- Epoch 42 / 1369 - 1675 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0012 --- Epoch 43 / 1369 - 1676 epochs total Iteration 0, loss = 0.0008 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0012 --- Epoch 44 / 1369 - 1677 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0058 --- Epoch 45 / 1369 - 1678 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0059 
Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0081 --- Epoch 46 / 1369 - 1679 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0059 --- Epoch 47 / 1369 - 1680 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0005 Iteration 80, loss = 0.0042 --- Epoch 48 / 1369 - 1681 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0072 --- Epoch 49 / 1369 - 1682 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0041 --- Epoch 50 / 1369 - 1683 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0010 --- Epoch 51 / 1369 - 1684 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0118 --- Epoch 52 / 1369 - 1685 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0042 --- Epoch 53 / 1369 - 1686 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0031 --- Epoch 54 / 1369 - 1687 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0025 --- Epoch 55 / 1369 - 1688 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0005 --- Epoch 56 / 1369 - 1689 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0127 
Iteration 80, loss = 0.0027 --- Epoch 57 / 1369 - 1690 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0037 --- Epoch 58 / 1369 - 1691 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0029 --- Epoch 59 / 1369 - 1692 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0013 --- Epoch 60 / 1369 - 1693 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0169 --- Epoch 61 / 1369 - 1694 epochs total Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0034 --- Epoch 62 / 1369 - 1695 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0089 --- Epoch 63 / 1369 - 1696 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0188 --- Epoch 64 / 1369 - 1697 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0048 --- Epoch 65 / 1369 - 1698 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0052 --- Epoch 66 / 1369 - 1699 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0025 --- Epoch 67 / 1369 - 1700 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0092 
--- Epoch 68 / 1369 - 1701 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0008 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0064 --- Epoch 69 / 1369 - 1702 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0008 Iteration 60, loss = 0.0252 Iteration 80, loss = 0.0076 --- Epoch 70 / 1369 - 1703 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0008 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0056 --- Epoch 71 / 1369 - 1704 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0005 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0028 --- Epoch 72 / 1369 - 1705 epochs total Iteration 0, loss = 0.0007 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0024 --- Epoch 73 / 1369 - 1706 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0093 --- Epoch 74 / 1369 - 1707 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0052 --- Epoch 75 / 1369 - 1708 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0034 --- Epoch 76 / 1369 - 1709 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0016 --- Epoch 77 / 1369 - 1710 epochs total Iteration 0, loss = 0.0296 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0041 --- Epoch 78 / 1369 - 1711 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0018 --- Epoch 79 / 1369 - 1712 
epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0051 --- Epoch 80 / 1369 - 1713 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0066 --- Epoch 81 / 1369 - 1714 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0068 --- Epoch 82 / 1369 - 1715 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0244 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0062 --- Epoch 83 / 1369 - 1716 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0007 --- Epoch 84 / 1369 - 1717 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0053 --- Epoch 85 / 1369 - 1718 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0131 --- Epoch 86 / 1369 - 1719 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0015 --- Epoch 87 / 1369 - 1720 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0029 --- Epoch 88 / 1369 - 1721 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0011 --- Epoch 89 / 1369 - 1722 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0082 --- Epoch 90 / 1369 - 1723 epochs total Iteration 0, loss 
= 0.0021 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0008 --- Epoch 91 / 1369 - 1724 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0034 --- Epoch 92 / 1369 - 1725 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0005 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0029 --- Epoch 93 / 1369 - 1726 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0010 --- Epoch 94 / 1369 - 1727 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0021 --- Epoch 95 / 1369 - 1728 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0210 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0029 --- Epoch 96 / 1369 - 1729 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0093 --- Epoch 97 / 1369 - 1730 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0015 --- Epoch 98 / 1369 - 1731 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0027 --- Epoch 99 / 1369 - 1732 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0016 --- Epoch 100 / 1369 - 1733 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0153 --- Epoch 101 / 1369 - 1734 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss 
= 0.0053 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0025 --- Epoch 102 / 1369 - 1735 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0105 --- Epoch 103 / 1369 - 1736 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0007 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0019 --- Epoch 104 / 1369 - 1737 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0020 --- Epoch 105 / 1369 - 1738 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0050 --- Epoch 106 / 1369 - 1739 epochs total Iteration 0, loss = 0.0006 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0014 --- Epoch 107 / 1369 - 1740 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0024 --- Epoch 108 / 1369 - 1741 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0138 --- Epoch 109 / 1369 - 1742 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0055 --- Epoch 110 / 1369 - 1743 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0015 --- Epoch 111 / 1369 - 1744 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0057 --- Epoch 112 / 1369 - 1745 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0032 Iteration 
40, loss = 0.0026 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0088 --- Epoch 113 / 1369 - 1746 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0025 --- Epoch 114 / 1369 - 1747 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0023 --- Epoch 115 / 1369 - 1748 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0206 --- Epoch 116 / 1369 - 1749 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0240 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0054 --- Epoch 117 / 1369 - 1750 epochs total Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0075 --- Epoch 118 / 1369 - 1751 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0332 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0045 --- Epoch 119 / 1369 - 1752 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0149 --- Epoch 120 / 1369 - 1753 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0018 --- Epoch 121 / 1369 - 1754 epochs total Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0192 --- Epoch 122 / 1369 - 1755 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0035 --- Epoch 123 / 1369 - 1756 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0018 
Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0035 --- Epoch 124 / 1369 - 1757 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0036 --- Epoch 125 / 1369 - 1758 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0134 --- Epoch 126 / 1369 - 1759 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0012 --- Epoch 127 / 1369 - 1760 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0033 --- Epoch 128 / 1369 - 1761 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0074 --- Epoch 129 / 1369 - 1762 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0034 --- Epoch 130 / 1369 - 1763 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0078 --- Epoch 131 / 1369 - 1764 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0279 Iteration 80, loss = 0.0081 --- Epoch 132 / 1369 - 1765 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0021 --- Epoch 133 / 1369 - 1766 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0013 --- Epoch 134 / 1369 - 1767 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0158 Iteration 60, loss 
= 0.0051 Iteration 80, loss = 0.0065 --- Epoch 135 / 1369 - 1768 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0007 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0016 --- Epoch 136 / 1369 - 1769 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0278 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0038 --- Epoch 137 / 1369 - 1770 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0048 --- Epoch 138 / 1369 - 1771 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0029 --- Epoch 139 / 1369 - 1772 epochs total Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0042 --- Epoch 140 / 1369 - 1773 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0133 --- Epoch 141 / 1369 - 1774 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0091 --- Epoch 142 / 1369 - 1775 epochs total Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0096 --- Epoch 143 / 1369 - 1776 epochs total Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0019 --- Epoch 144 / 1369 - 1777 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0013 --- Epoch 145 / 1369 - 1778 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0058 Iteration 
80, loss = 0.0021 --- Epoch 146 / 1369 - 1779 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0018 --- Epoch 147 / 1369 - 1780 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0077 --- Epoch 148 / 1369 - 1781 epochs total Iteration 0, loss = 0.0235 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0061 --- Epoch 149 / 1369 - 1782 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0061 --- Epoch 150 / 1369 - 1783 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0049 --- Epoch 151 / 1369 - 1784 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0209 --- Epoch 152 / 1369 - 1785 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0022 --- Epoch 153 / 1369 - 1786 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0040 --- Epoch 154 / 1369 - 1787 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0039 --- Epoch 155 / 1369 - 1788 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0224 Iteration 80, loss = 0.0034 --- Epoch 156 / 1369 - 1789 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0016 
--- Epoch 157 / 1369 - 1790 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0041 --- Epoch 158 / 1369 - 1791 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0025 --- Epoch 159 / 1369 - 1792 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0397 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0170 --- Epoch 160 / 1369 - 1793 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0088 --- Epoch 161 / 1369 - 1794 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0053 --- Epoch 162 / 1369 - 1795 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0088 --- Epoch 163 / 1369 - 1796 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0040 --- Epoch 164 / 1369 - 1797 epochs total Iteration 0, loss = 0.0256 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0044 --- Epoch 165 / 1369 - 1798 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0073 --- Epoch 166 / 1369 - 1799 epochs total Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0120 --- Epoch 167 / 1369 - 1800 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0138 --- Epoch 168 / 
1369 - 1801 epochs total Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0034 --- Epoch 169 / 1369 - 1802 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0087 --- Epoch 170 / 1369 - 1803 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0240 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0024 --- Epoch 171 / 1369 - 1804 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0008 --- Epoch 172 / 1369 - 1805 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0151 --- Epoch 173 / 1369 - 1806 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0034 --- Epoch 174 / 1369 - 1807 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0038 --- Epoch 175 / 1369 - 1808 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0075 --- Epoch 176 / 1369 - 1809 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0006 Iteration 60, loss = 0.0196 Iteration 80, loss = 0.0082 --- Epoch 177 / 1369 - 1810 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0071 --- Epoch 178 / 1369 - 1811 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0060 --- Epoch 179 / 1369 - 1812 epochs 
total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0261 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0048 --- Epoch 180 / 1369 - 1813 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0211 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0119 --- Epoch 181 / 1369 - 1814 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0088 --- Epoch 182 / 1369 - 1815 epochs total Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0015 --- Epoch 183 / 1369 - 1816 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0054 --- Epoch 184 / 1369 - 1817 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0026 --- Epoch 185 / 1369 - 1818 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0129 --- Epoch 186 / 1369 - 1819 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0027 --- Epoch 187 / 1369 - 1820 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0081 --- Epoch 188 / 1369 - 1821 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0029 --- Epoch 189 / 1369 - 1822 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0023 --- Epoch 190 / 1369 - 1823 epochs total Iteration 0, 
loss = 0.0211 Iteration 20, loss = 0.0151 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0025 --- Epoch 191 / 1369 - 1824 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0101 --- Epoch 192 / 1369 - 1825 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0067 --- Epoch 193 / 1369 - 1826 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0116 --- Epoch 194 / 1369 - 1827 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0035 --- Epoch 195 / 1369 - 1828 epochs total Iteration 0, loss = 0.0007 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0030 --- Epoch 196 / 1369 - 1829 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0067 --- Epoch 197 / 1369 - 1830 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0020 --- Epoch 198 / 1369 - 1831 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0128 --- Epoch 199 / 1369 - 1832 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0021 --- Epoch 200 / 1369 - 1833 epochs total Iteration 0, loss = 0.0281 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0058 --- Epoch 201 / 1369 - 1834 epochs total Iteration 0, loss = 0.0103 
Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0080 --- Epoch 202 / 1369 - 1835 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0019 --- Epoch 203 / 1369 - 1836 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0242 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0104 --- Epoch 204 / 1369 - 1837 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0054 --- Epoch 205 / 1369 - 1838 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0187 Iteration 80, loss = 0.0110 --- Epoch 206 / 1369 - 1839 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0055 --- Epoch 207 / 1369 - 1840 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0037 --- Epoch 208 / 1369 - 1841 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0282 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0013 --- Epoch 209 / 1369 - 1842 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0041 --- Epoch 210 / 1369 - 1843 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0083 --- Epoch 211 / 1369 - 1844 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0091 --- Epoch 212 / 1369 - 1845 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss 
= 0.0017 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0062 --- Epoch 213 / 1369 - 1846 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0046 --- Epoch 214 / 1369 - 1847 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0310 Iteration 80, loss = 0.0021 --- Epoch 215 / 1369 - 1848 epochs total Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0379 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0074 --- Epoch 216 / 1369 - 1849 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0017 --- Epoch 217 / 1369 - 1850 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0130 --- Epoch 218 / 1369 - 1851 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0094 --- Epoch 219 / 1369 - 1852 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0030 --- Epoch 220 / 1369 - 1853 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0020 --- Epoch 221 / 1369 - 1854 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0024 --- Epoch 222 / 1369 - 1855 epochs total Iteration 0, loss = 0.0007 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0063 --- Epoch 223 / 1369 - 1856 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0037 Iteration 
40, loss = 0.0049 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0094 --- Epoch 224 / 1369 - 1857 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0046 --- Epoch 225 / 1369 - 1858 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0088 --- Epoch 226 / 1369 - 1859 epochs total Iteration 0, loss = 0.0005 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0060 --- Epoch 227 / 1369 - 1860 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0014 --- Epoch 228 / 1369 - 1861 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0050 --- Epoch 229 / 1369 - 1862 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0011 --- Epoch 230 / 1369 - 1863 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0095 --- Epoch 231 / 1369 - 1864 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0092 --- Epoch 232 / 1369 - 1865 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0027 --- Epoch 233 / 1369 - 1866 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0029 --- Epoch 234 / 1369 - 1867 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0011 
Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0026 --- Epoch 235 / 1369 - 1868 epochs total Iteration 0, loss = 0.0206 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0021 --- Epoch 236 / 1369 - 1869 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0023 --- Epoch 237 / 1369 - 1870 epochs total Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0069 --- Epoch 238 / 1369 - 1871 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0008 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0037 --- Epoch 239 / 1369 - 1872 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0018 --- Epoch 240 / 1369 - 1873 epochs total Iteration 0, loss = 0.0182 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0019 --- Epoch 241 / 1369 - 1874 epochs total Iteration 0, loss = 0.0004 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0042 --- Epoch 242 / 1369 - 1875 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0035 --- Epoch 243 / 1369 - 1876 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0028 --- Epoch 244 / 1369 - 1877 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0014 --- Epoch 245 / 1369 - 1878 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0023 Iteration 60, loss 
= 0.0033 Iteration 80, loss = 0.0029 --- Epoch 246 / 1369 - 1879 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0095 --- Epoch 247 / 1369 - 1880 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0008 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0026 --- Epoch 248 / 1369 - 1881 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0013 --- Epoch 249 / 1369 - 1882 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0005 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0046 --- Epoch 250 / 1369 - 1883 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0105 --- Epoch 251 / 1369 - 1884 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0134 --- Epoch 252 / 1369 - 1885 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0012 --- Epoch 253 / 1369 - 1886 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0009 --- Epoch 254 / 1369 - 1887 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0045 --- Epoch 255 / 1369 - 1888 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0034 --- Epoch 256 / 1369 - 1889 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0024 Iteration 
80, loss = 0.0079 --- Epoch 257 / 1369 - 1890 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0042 --- Epoch 258 / 1369 - 1891 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0077 --- Epoch 259 / 1369 - 1892 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0017 --- Epoch 260 / 1369 - 1893 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0081 --- Epoch 261 / 1369 - 1894 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0047 --- Epoch 262 / 1369 - 1895 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0045 --- Epoch 263 / 1369 - 1896 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0029 --- Epoch 264 / 1369 - 1897 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0022 --- Epoch 265 / 1369 - 1898 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0019 --- Epoch 266 / 1369 - 1899 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0012 --- Epoch 267 / 1369 - 1900 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0045 
--- Epoch 268 / 1369 - 1901 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0043 --- Epoch 269 / 1369 - 1902 epochs total Iteration 0, loss = 0.0284 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0163 Iteration 80, loss = 0.0041 --- Epoch 270 / 1369 - 1903 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0021 --- Epoch 271 / 1369 - 1904 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0092 --- Epoch 272 / 1369 - 1905 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0310 --- Epoch 273 / 1369 - 1906 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0018 --- Epoch 274 / 1369 - 1907 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0058 --- Epoch 275 / 1369 - 1908 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0035 --- Epoch 276 / 1369 - 1909 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0019 --- Epoch 277 / 1369 - 1910 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0041 --- Epoch 278 / 1369 - 1911 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0023 --- Epoch 279 / 
1369 - 1912 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0019 --- Epoch 280 / 1369 - 1913 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0015 --- Epoch 281 / 1369 - 1914 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0074 --- Epoch 282 / 1369 - 1915 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0137 Iteration 80, loss = 0.0064 --- Epoch 283 / 1369 - 1916 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0040 --- Epoch 284 / 1369 - 1917 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0026 --- Epoch 285 / 1369 - 1918 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0250 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0025 --- Epoch 286 / 1369 - 1919 epochs total Iteration 0, loss = 0.0150 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0074 --- Epoch 287 / 1369 - 1920 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0022 --- Epoch 288 / 1369 - 1921 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0005 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0038 --- Epoch 289 / 1369 - 1922 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0019 --- Epoch 290 / 1369 - 1923 epochs 
total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0046 --- Epoch 291 / 1369 - 1924 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0235 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0053 --- Epoch 292 / 1369 - 1925 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0056 --- Epoch 293 / 1369 - 1926 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0073 --- Epoch 294 / 1369 - 1927 epochs total Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0031 --- Epoch 295 / 1369 - 1928 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0020 --- Epoch 296 / 1369 - 1929 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0033 --- Epoch 297 / 1369 - 1930 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0017 --- Epoch 298 / 1369 - 1931 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0173 --- Epoch 299 / 1369 - 1932 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0015 --- Epoch 300 / 1369 - 1933 epochs total Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0008 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0010 --- Epoch 301 / 1369 - 1934 epochs total Iteration 0, 
loss = 0.0019 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0125 --- Epoch 302 / 1369 - 1935 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0029 --- Epoch 303 / 1369 - 1936 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0051 --- Epoch 304 / 1369 - 1937 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0068 --- Epoch 305 / 1369 - 1938 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0015 --- Epoch 306 / 1369 - 1939 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0032 --- Epoch 307 / 1369 - 1940 epochs total Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0057 --- Epoch 308 / 1369 - 1941 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0178 --- Epoch 309 / 1369 - 1942 epochs total Iteration 0, loss = 0.0310 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0006 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0032 --- Epoch 310 / 1369 - 1943 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0025 --- Epoch 311 / 1369 - 1944 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0076 --- Epoch 312 / 1369 - 1945 epochs total Iteration 0, loss = 0.0012 
Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0073 --- Epoch 313 / 1369 - 1946 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0076 --- Epoch 314 / 1369 - 1947 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0009 --- Epoch 315 / 1369 - 1948 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0016 --- Epoch 316 / 1369 - 1949 epochs total Iteration 0, loss = 0.0232 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0036 --- Epoch 317 / 1369 - 1950 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0099 --- Epoch 318 / 1369 - 1951 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0013 --- Epoch 319 / 1369 - 1952 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0079 --- Epoch 320 / 1369 - 1953 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0015 --- Epoch 321 / 1369 - 1954 epochs total Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0163 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0038 --- Epoch 322 / 1369 - 1955 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0022 --- Epoch 323 / 1369 - 1956 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss 
= 0.0010 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0055 --- Epoch 324 / 1369 - 1957 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0078 --- Epoch 325 / 1369 - 1958 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0017 --- Epoch 326 / 1369 - 1959 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0100 --- Epoch 327 / 1369 - 1960 epochs total Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0054 --- Epoch 328 / 1369 - 1961 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0036 --- Epoch 329 / 1369 - 1962 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0087 --- Epoch 330 / 1369 - 1963 epochs total Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0035 --- Epoch 331 / 1369 - 1964 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0014 --- Epoch 332 / 1369 - 1965 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0038 --- Epoch 333 / 1369 - 1966 epochs total Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0329 --- Epoch 334 / 1369 - 1967 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0033 Iteration 
40, loss = 0.0005 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0015 --- Epoch 335 / 1369 - 1968 epochs total Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0204 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0048 --- Epoch 336 / 1369 - 1969 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0022 --- Epoch 337 / 1369 - 1970 epochs total Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0016 --- Epoch 338 / 1369 - 1971 epochs total Iteration 0, loss = 0.0006 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0076 --- Epoch 339 / 1369 - 1972 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0034 --- Epoch 340 / 1369 - 1973 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0052 --- Epoch 341 / 1369 - 1974 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0011 --- Epoch 342 / 1369 - 1975 epochs total Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0151 --- Epoch 343 / 1369 - 1976 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0020 --- Epoch 344 / 1369 - 1977 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0005 Iteration 80, loss = 0.0095 --- Epoch 345 / 1369 - 1978 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0012 
Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0024 --- Epoch 346 / 1369 - 1979 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0013 --- Epoch 347 / 1369 - 1980 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0009 --- Epoch 348 / 1369 - 1981 epochs total Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0060 --- Epoch 349 / 1369 - 1982 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0333 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0067 --- Epoch 350 / 1369 - 1983 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0026 --- Epoch 351 / 1369 - 1984 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0018 --- Epoch 352 / 1369 - 1985 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0035 --- Epoch 353 / 1369 - 1986 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0256 --- Epoch 354 / 1369 - 1987 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0050 --- Epoch 355 / 1369 - 1988 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0147 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0020 --- Epoch 356 / 1369 - 1989 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0223 Iteration 60, loss 
= 0.0024 Iteration 80, loss = 0.0052 --- Epoch 357 / 1369 - 1990 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0108 --- Epoch 358 / 1369 - 1991 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0100 --- Epoch 359 / 1369 - 1992 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0062 --- Epoch 360 / 1369 - 1993 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0021 --- Epoch 361 / 1369 - 1994 epochs total Iteration 0, loss = 0.0286 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0005 Iteration 80, loss = 0.0031 --- Epoch 362 / 1369 - 1995 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0020 --- Epoch 363 / 1369 - 1996 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0261 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0021 --- Epoch 364 / 1369 - 1997 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0061 --- Epoch 365 / 1369 - 1998 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0048 --- Epoch 366 / 1369 - 1999 epochs total Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0011 --- Epoch 367 / 1369 - 2000 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0015 Iteration 
80, loss = 0.0020 --- Epoch 368 / 1369 - 2001 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0069 --- Epoch 369 / 1369 - 2002 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0023 --- Epoch 370 / 1369 - 2003 epochs total Iteration 0, loss = 0.0242 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0034 --- Epoch 371 / 1369 - 2004 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0067 --- Epoch 372 / 1369 - 2005 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0023 --- Epoch 373 / 1369 - 2006 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0049 --- Epoch 374 / 1369 - 2007 epochs total Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0054 --- Epoch 375 / 1369 - 2008 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0033 --- Epoch 376 / 1369 - 2009 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0011 --- Epoch 377 / 1369 - 2010 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0054 --- Epoch 378 / 1369 - 2011 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0131 
--- Epoch 379 / 1369 - 2012 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0046 --- Epoch 380 / 1369 - 2013 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0296 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0077 --- Epoch 381 / 1369 - 2014 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0016 --- Epoch 382 / 1369 - 2015 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0016 --- Epoch 383 / 1369 - 2016 epochs total Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0058 --- Epoch 384 / 1369 - 2017 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0031 --- Epoch 385 / 1369 - 2018 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0069 --- Epoch 386 / 1369 - 2019 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0027 --- Epoch 387 / 1369 - 2020 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0011 --- Epoch 388 / 1369 - 2021 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0047 --- Epoch 389 / 1369 - 2022 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0034 --- Epoch 390 / 
1369 - 2023 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0035 --- Epoch 391 / 1369 - 2024 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0219 Iteration 80, loss = 0.0007 --- Epoch 392 / 1369 - 2025 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0018 --- Epoch 393 / 1369 - 2026 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0021 --- Epoch 394 / 1369 - 2027 epochs total Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0075 --- Epoch 395 / 1369 - 2028 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0017 --- Epoch 396 / 1369 - 2029 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0022 --- Epoch 397 / 1369 - 2030 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0352 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0058 --- Epoch 398 / 1369 - 2031 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0056 --- Epoch 399 / 1369 - 2032 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0009 --- Epoch 400 / 1369 - 2033 epochs total Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0109 --- Epoch 401 / 1369 - 2034 epochs 
total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0127 --- Epoch 402 / 1369 - 2035 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0013 --- Epoch 403 / 1369 - 2036 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0079 --- Epoch 404 / 1369 - 2037 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0069 --- Epoch 405 / 1369 - 2038 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0070 --- Epoch 406 / 1369 - 2039 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0152 --- Epoch 407 / 1369 - 2040 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0044 --- Epoch 408 / 1369 - 2041 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0500 Iteration 80, loss = 0.0037 --- Epoch 409 / 1369 - 2042 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0093 --- Epoch 410 / 1369 - 2043 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0023 --- Epoch 411 / 1369 - 2044 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0109 --- Epoch 412 / 1369 - 2045 epochs total Iteration 0, 
loss = 0.0047 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0046 --- Epoch 413 / 1369 - 2046 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0222 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0037 --- Epoch 414 / 1369 - 2047 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0030 --- Epoch 415 / 1369 - 2048 epochs total Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0023 --- Epoch 416 / 1369 - 2049 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0024 --- Epoch 417 / 1369 - 2050 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0029 --- Epoch 418 / 1369 - 2051 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0068 --- Epoch 419 / 1369 - 2052 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0041 --- Epoch 420 / 1369 - 2053 epochs total Iteration 0, loss = 0.0157 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0094 --- Epoch 421 / 1369 - 2054 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0182 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0088 --- Epoch 422 / 1369 - 2055 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0014 --- Epoch 423 / 1369 - 2056 epochs total Iteration 0, loss = 0.0085 
Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0012 --- Epoch 424 / 1369 - 2057 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0090 --- Epoch 425 / 1369 - 2058 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0208 Iteration 80, loss = 0.0033 --- Epoch 426 / 1369 - 2059 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0022 --- Epoch 427 / 1369 - 2060 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0058 --- Epoch 428 / 1369 - 2061 epochs total Iteration 0, loss = 0.0207 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0038 --- Epoch 429 / 1369 - 2062 epochs total Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0029 --- Epoch 430 / 1369 - 2063 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0006 --- Epoch 431 / 1369 - 2064 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0030 --- Epoch 432 / 1369 - 2065 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0010 --- Epoch 433 / 1369 - 2066 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0021 --- Epoch 434 / 1369 - 2067 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss 
= 0.0188 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0008 --- Epoch 435 / 1369 - 2068 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0100 --- Epoch 436 / 1369 - 2069 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0027 --- Epoch 437 / 1369 - 2070 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0018 --- Epoch 438 / 1369 - 2071 epochs total Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0079 --- Epoch 439 / 1369 - 2072 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0084 --- Epoch 440 / 1369 - 2073 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0237 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0058 --- Epoch 441 / 1369 - 2074 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0033 --- Epoch 442 / 1369 - 2075 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0025 --- Epoch 443 / 1369 - 2076 epochs total Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0112 --- Epoch 444 / 1369 - 2077 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0008 --- Epoch 445 / 1369 - 2078 epochs total Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0014 Iteration 
40, loss = 0.0029 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0034 --- Epoch 446 / 1369 - 2079 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0081 --- Epoch 447 / 1369 - 2080 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0081 --- Epoch 448 / 1369 - 2081 epochs total Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0015 --- Epoch 449 / 1369 - 2082 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0040 --- Epoch 450 / 1369 - 2083 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0016 --- Epoch 451 / 1369 - 2084 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0046 --- Epoch 452 / 1369 - 2085 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0061 --- Epoch 453 / 1369 - 2086 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0311 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0090 --- Epoch 454 / 1369 - 2087 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0042 --- Epoch 455 / 1369 - 2088 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0037 --- Epoch 456 / 1369 - 2089 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0094 
Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0208 --- Epoch 457 / 1369 - 2090 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0009 --- Epoch 458 / 1369 - 2091 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0179 --- Epoch 459 / 1369 - 2092 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0169 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0044 --- Epoch 460 / 1369 - 2093 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0006 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0019 --- Epoch 461 / 1369 - 2094 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0064 --- Epoch 462 / 1369 - 2095 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0011 --- Epoch 463 / 1369 - 2096 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0008 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0048 --- Epoch 464 / 1369 - 2097 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0019 --- Epoch 465 / 1369 - 2098 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0061 --- Epoch 466 / 1369 - 2099 epochs total Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0053 --- Epoch 467 / 1369 - 2100 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0035 Iteration 60, loss 
= 0.0051 Iteration 80, loss = 0.0045 --- Epoch 468 / 1369 - 2101 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0025 --- Epoch 469 / 1369 - 2102 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0019 --- Epoch 470 / 1369 - 2103 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0206 Iteration 80, loss = 0.0110 --- Epoch 471 / 1369 - 2104 epochs total Iteration 0, loss = 0.0005 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0032 --- Epoch 472 / 1369 - 2105 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0226 --- Epoch 473 / 1369 - 2106 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0024 --- Epoch 474 / 1369 - 2107 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0050 --- Epoch 475 / 1369 - 2108 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0037 --- Epoch 476 / 1369 - 2109 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0050 --- Epoch 477 / 1369 - 2110 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0156 --- Epoch 478 / 1369 - 2111 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0037 Iteration 
80, loss = 0.0020 --- Epoch 479 / 1369 - 2112 epochs total Iteration 0, loss = 0.0134 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0065 --- Epoch 480 / 1369 - 2113 epochs total Iteration 0, loss = 0.0006 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0022 --- Epoch 481 / 1369 - 2114 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0015 --- Epoch 482 / 1369 - 2115 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0082 --- Epoch 483 / 1369 - 2116 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0015 --- Epoch 484 / 1369 - 2117 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0012 --- Epoch 485 / 1369 - 2118 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0038 --- Epoch 486 / 1369 - 2119 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0006 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0014 --- Epoch 487 / 1369 - 2120 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0042 --- Epoch 488 / 1369 - 2121 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0051 --- Epoch 489 / 1369 - 2122 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0065 
--- Epoch 490 / 1369 - 2123 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0053 --- Epoch 491 / 1369 - 2124 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0049 --- Epoch 492 / 1369 - 2125 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0098 --- Epoch 493 / 1369 - 2126 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0017 --- Epoch 494 / 1369 - 2127 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0015 --- Epoch 495 / 1369 - 2128 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0021 --- Epoch 496 / 1369 - 2129 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0024 --- Epoch 497 / 1369 - 2130 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0148 --- Epoch 498 / 1369 - 2131 epochs total Iteration 0, loss = 0.0184 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0057 --- Epoch 499 / 1369 - 2132 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0018 --- Epoch 500 / 1369 - 2133 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0029 --- Epoch 501 / 
1369 - 2134 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0056 --- Epoch 502 / 1369 - 2135 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0033 --- Epoch 503 / 1369 - 2136 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0038 --- Epoch 504 / 1369 - 2137 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0073 --- Epoch 505 / 1369 - 2138 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0021 --- Epoch 506 / 1369 - 2139 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0031 --- Epoch 507 / 1369 - 2140 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0046 --- Epoch 508 / 1369 - 2141 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0055 --- Epoch 509 / 1369 - 2142 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0088 --- Epoch 510 / 1369 - 2143 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0148 --- Epoch 511 / 1369 - 2144 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0039 --- Epoch 512 / 1369 - 2145 epochs 
total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0031 --- Epoch 513 / 1369 - 2146 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0226 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0036 --- Epoch 514 / 1369 - 2147 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0068 --- Epoch 515 / 1369 - 2148 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0048 --- Epoch 516 / 1369 - 2149 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0017 --- Epoch 517 / 1369 - 2150 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0025 --- Epoch 518 / 1369 - 2151 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0047 --- Epoch 519 / 1369 - 2152 epochs total Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0036 --- Epoch 520 / 1369 - 2153 epochs total Iteration 0, loss = 0.0007 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0116 --- Epoch 521 / 1369 - 2154 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0118 --- Epoch 522 / 1369 - 2155 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0035 --- Epoch 523 / 1369 - 2156 epochs total Iteration 0, 
loss = 0.0056 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0045 --- Epoch 524 / 1369 - 2157 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0019 --- Epoch 525 / 1369 - 2158 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0036 --- Epoch 526 / 1369 - 2159 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0035 --- Epoch 527 / 1369 - 2160 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0084 --- Epoch 528 / 1369 - 2161 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0011 --- Epoch 529 / 1369 - 2162 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0058 --- Epoch 530 / 1369 - 2163 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0012 --- Epoch 531 / 1369 - 2164 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0048 --- Epoch 532 / 1369 - 2165 epochs total Iteration 0, loss = 0.0352 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0029 --- Epoch 533 / 1369 - 2166 epochs total Iteration 0, loss = 0.0215 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0036 --- Epoch 534 / 1369 - 2167 epochs total Iteration 0, loss = 0.0039 
Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0025 --- Epoch 535 / 1369 - 2168 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0081 --- Epoch 536 / 1369 - 2169 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0016 --- Epoch 537 / 1369 - 2170 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0048 --- Epoch 538 / 1369 - 2171 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0127 --- Epoch 539 / 1369 - 2172 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0054 --- Epoch 540 / 1369 - 2173 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0009 --- Epoch 541 / 1369 - 2174 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0041 --- Epoch 542 / 1369 - 2175 epochs total Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0026 --- Epoch 543 / 1369 - 2176 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0071 --- Epoch 544 / 1369 - 2177 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0006 --- Epoch 545 / 1369 - 2178 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss 
= 0.0032 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0053 --- Epoch 546 / 1369 - 2179 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0130 --- Epoch 547 / 1369 - 2180 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0046 --- Epoch 548 / 1369 - 2181 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0310 Iteration 80, loss = 0.0043 --- Epoch 549 / 1369 - 2182 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0031 --- Epoch 550 / 1369 - 2183 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0005 --- Epoch 551 / 1369 - 2184 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0021 --- Epoch 552 / 1369 - 2185 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0007 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0024 --- Epoch 553 / 1369 - 2186 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0043 --- Epoch 554 / 1369 - 2187 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0017 --- Epoch 555 / 1369 - 2188 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0083 --- Epoch 556 / 1369 - 2189 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0051 Iteration 
40, loss = 0.0024 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0018 --- Epoch 557 / 1369 - 2190 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0021 --- Epoch 558 / 1369 - 2191 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0057 --- Epoch 559 / 1369 - 2192 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0139 --- Epoch 560 / 1369 - 2193 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0011 --- Epoch 561 / 1369 - 2194 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0045 --- Epoch 562 / 1369 - 2195 epochs total Iteration 0, loss = 0.0242 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0122 --- Epoch 563 / 1369 - 2196 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0310 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0019 --- Epoch 564 / 1369 - 2197 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0049 --- Epoch 565 / 1369 - 2198 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0023 --- Epoch 566 / 1369 - 2199 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0019 --- Epoch 567 / 1369 - 2200 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0059 
Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0113 --- Epoch 568 / 1369 - 2201 epochs total Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0030 --- Epoch 569 / 1369 - 2202 epochs total Iteration 0, loss = 0.0007 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0414 --- Epoch 570 / 1369 - 2203 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0073 --- Epoch 571 / 1369 - 2204 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0151 --- Epoch 572 / 1369 - 2205 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0029 --- Epoch 573 / 1369 - 2206 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0172 --- Epoch 574 / 1369 - 2207 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0021 --- Epoch 575 / 1369 - 2208 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0081 --- Epoch 576 / 1369 - 2209 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0018 --- Epoch 577 / 1369 - 2210 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0027 --- Epoch 578 / 1369 - 2211 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0052 Iteration 60, loss 
= 0.0046 Iteration 80, loss = 0.0022 --- Epoch 579 / 1369 - 2212 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0030 --- Epoch 580 / 1369 - 2213 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0062 --- Epoch 581 / 1369 - 2214 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0029 --- Epoch 582 / 1369 - 2215 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0282 Iteration 80, loss = 0.0055 --- Epoch 583 / 1369 - 2216 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0314 --- Epoch 584 / 1369 - 2217 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0016 --- Epoch 585 / 1369 - 2218 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0038 --- Epoch 586 / 1369 - 2219 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0030 --- Epoch 587 / 1369 - 2220 epochs total Iteration 0, loss = 0.0008 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0010 --- Epoch 588 / 1369 - 2221 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0048 --- Epoch 589 / 1369 - 2222 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0020 Iteration 
80, loss = 0.0015 --- Epoch 590 / 1369 - 2223 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0007 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0040 --- Epoch 591 / 1369 - 2224 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0021 --- Epoch 592 / 1369 - 2225 epochs total Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0086 --- Epoch 593 / 1369 - 2226 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0032 --- Epoch 594 / 1369 - 2227 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0022 --- Epoch 595 / 1369 - 2228 epochs total Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0132 --- Epoch 596 / 1369 - 2229 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0085 --- Epoch 597 / 1369 - 2230 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0091 --- Epoch 598 / 1369 - 2231 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0015 --- Epoch 599 / 1369 - 2232 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0127 --- Epoch 600 / 1369 - 2233 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0118 
--- Epoch 601 / 1369 - 2234 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0029 --- Epoch 602 / 1369 - 2235 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0023 --- Epoch 603 / 1369 - 2236 epochs total Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0013 --- Epoch 604 / 1369 - 2237 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0033 --- Epoch 605 / 1369 - 2238 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0033 --- Epoch 606 / 1369 - 2239 epochs total Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0017 --- Epoch 607 / 1369 - 2240 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0111 Iteration 80, loss = 0.0023 --- Epoch 608 / 1369 - 2241 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0015 --- Epoch 609 / 1369 - 2242 epochs total Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0053 --- Epoch 610 / 1369 - 2243 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0030 --- Epoch 611 / 1369 - 2244 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0300 Iteration 80, loss = 0.0074 --- Epoch 612 / 
1369 - 2245 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0033 --- Epoch 613 / 1369 - 2246 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0012 --- Epoch 614 / 1369 - 2247 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0209 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0009 --- Epoch 615 / 1369 - 2248 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0040 --- Epoch 616 / 1369 - 2249 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0030 --- Epoch 617 / 1369 - 2250 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0014 --- Epoch 618 / 1369 - 2251 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0050 --- Epoch 619 / 1369 - 2252 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0041 --- Epoch 620 / 1369 - 2253 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0015 --- Epoch 621 / 1369 - 2254 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0040 --- Epoch 622 / 1369 - 2255 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0022 --- Epoch 623 / 1369 - 2256 epochs 
total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0053 --- Epoch 624 / 1369 - 2257 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0029 --- Epoch 625 / 1369 - 2258 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0038 --- Epoch 626 / 1369 - 2259 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0030 --- Epoch 627 / 1369 - 2260 epochs total Iteration 0, loss = 0.0250 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0014 --- Epoch 628 / 1369 - 2261 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0040 --- Epoch 629 / 1369 - 2262 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0045 --- Epoch 630 / 1369 - 2263 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0168 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0029 --- Epoch 631 / 1369 - 2264 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0182 --- Epoch 632 / 1369 - 2265 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0053 --- Epoch 633 / 1369 - 2266 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0042 --- Epoch 634 / 1369 - 2267 epochs total Iteration 0, 
loss = 0.0109 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0039 --- Epoch 635 / 1369 - 2268 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0010 --- Epoch 636 / 1369 - 2269 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0013 --- Epoch 637 / 1369 - 2270 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0019 --- Epoch 638 / 1369 - 2271 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0046 --- Epoch 639 / 1369 - 2272 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0062 --- Epoch 640 / 1369 - 2273 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0062 --- Epoch 641 / 1369 - 2274 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0094 --- Epoch 642 / 1369 - 2275 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0032 --- Epoch 643 / 1369 - 2276 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0017 --- Epoch 644 / 1369 - 2277 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0136 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0081 --- Epoch 645 / 1369 - 2278 epochs total Iteration 0, loss = 0.0035 
Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0018 --- Epoch 646 / 1369 - 2279 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0177 --- Epoch 647 / 1369 - 2280 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0025 --- Epoch 648 / 1369 - 2281 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0055 --- Epoch 649 / 1369 - 2282 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0497 Iteration 80, loss = 0.0060 --- Epoch 650 / 1369 - 2283 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0031 --- Epoch 651 / 1369 - 2284 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0043 --- Epoch 652 / 1369 - 2285 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0039 --- Epoch 653 / 1369 - 2286 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0029 --- Epoch 654 / 1369 - 2287 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0022 --- Epoch 655 / 1369 - 2288 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0034 --- Epoch 656 / 1369 - 2289 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss 
= 0.0056 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0033 --- Epoch 657 / 1369 - 2290 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0009 --- Epoch 658 / 1369 - 2291 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0021 --- Epoch 659 / 1369 - 2292 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0007 --- Epoch 660 / 1369 - 2293 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0250 --- Epoch 661 / 1369 - 2294 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0088 --- Epoch 662 / 1369 - 2295 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0055 --- Epoch 663 / 1369 - 2296 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0014 --- Epoch 664 / 1369 - 2297 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0056 --- Epoch 665 / 1369 - 2298 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0149 --- Epoch 666 / 1369 - 2299 epochs total Iteration 0, loss = 0.0319 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0041 --- Epoch 667 / 1369 - 2300 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0025 Iteration 
40, loss = 0.0034 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0085 --- Epoch 668 / 1369 - 2301 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0059 --- Epoch 669 / 1369 - 2302 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0094 --- Epoch 670 / 1369 - 2303 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0020 --- Epoch 671 / 1369 - 2304 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0100 --- Epoch 672 / 1369 - 2305 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0008 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0030 --- Epoch 673 / 1369 - 2306 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0319 --- Epoch 674 / 1369 - 2307 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0010 --- Epoch 675 / 1369 - 2308 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0058 --- Epoch 676 / 1369 - 2309 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0280 Iteration 80, loss = 0.0085 --- Epoch 677 / 1369 - 2310 epochs total Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0104 --- Epoch 678 / 1369 - 2311 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0092 
Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0035 --- Epoch 679 / 1369 - 2312 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0027 --- Epoch 680 / 1369 - 2313 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0023 --- Epoch 681 / 1369 - 2314 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0021 --- Epoch 682 / 1369 - 2315 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0034 --- Epoch 683 / 1369 - 2316 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0039 --- Epoch 684 / 1369 - 2317 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0016 --- Epoch 685 / 1369 - 2318 epochs total Iteration 0, loss = 0.0310 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0030 --- Epoch 686 / 1369 - 2319 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0060 --- Epoch 687 / 1369 - 2320 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0124 --- Epoch 688 / 1369 - 2321 epochs total Iteration 0, loss = 0.0242 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0016 --- Epoch 689 / 1369 - 2322 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0030 Iteration 60, loss 
= 0.0049 Iteration 80, loss = 0.0054 --- Epoch 690 / 1369 - 2323 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0284 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0187 --- Epoch 691 / 1369 - 2324 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0115 --- Epoch 692 / 1369 - 2325 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0014 --- Epoch 693 / 1369 - 2326 epochs total Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0015 --- Epoch 694 / 1369 - 2327 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0088 --- Epoch 695 / 1369 - 2328 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0139 --- Epoch 696 / 1369 - 2329 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0088 --- Epoch 697 / 1369 - 2330 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0016 --- Epoch 698 / 1369 - 2331 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0378 --- Epoch 699 / 1369 - 2332 epochs total Iteration 0, loss = 0.0237 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0019 --- Epoch 700 / 1369 - 2333 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0021 Iteration 
80, loss = 0.0026 --- Epoch 701 / 1369 - 2334 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0022 --- Epoch 702 / 1369 - 2335 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0018 --- Epoch 703 / 1369 - 2336 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0025 --- Epoch 704 / 1369 - 2337 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0020 --- Epoch 705 / 1369 - 2338 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0008 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0060 --- Epoch 706 / 1369 - 2339 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0019 --- Epoch 707 / 1369 - 2340 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0016 --- Epoch 708 / 1369 - 2341 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0202 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0029 --- Epoch 709 / 1369 - 2342 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0019 --- Epoch 710 / 1369 - 2343 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0062 --- Epoch 711 / 1369 - 2344 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0057 
--- Epoch 712 / 1369 - 2345 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0385 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0037 --- Epoch 713 / 1369 - 2346 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0069 --- Epoch 714 / 1369 - 2347 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0014 --- Epoch 715 / 1369 - 2348 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0021 --- Epoch 716 / 1369 - 2349 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0013 --- Epoch 717 / 1369 - 2350 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0087 --- Epoch 718 / 1369 - 2351 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0005 Iteration 80, loss = 0.0035 --- Epoch 719 / 1369 - 2352 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0016 --- Epoch 720 / 1369 - 2353 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0015 --- Epoch 721 / 1369 - 2354 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0038 --- Epoch 722 / 1369 - 2355 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0005 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0032 --- Epoch 723 / 
1369 - 2356 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0073 --- Epoch 724 / 1369 - 2357 epochs total Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0008 --- Epoch 725 / 1369 - 2358 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0045 --- Epoch 726 / 1369 - 2359 epochs total Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0104 --- Epoch 727 / 1369 - 2360 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0158 Iteration 80, loss = 0.0058 --- Epoch 728 / 1369 - 2361 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0027 --- Epoch 729 / 1369 - 2362 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0127 --- Epoch 730 / 1369 - 2363 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0035 --- Epoch 731 / 1369 - 2364 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0157 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0106 --- Epoch 732 / 1369 - 2365 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0022 --- Epoch 733 / 1369 - 2366 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0137 --- Epoch 734 / 1369 - 2367 epochs 
total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0045 --- Epoch 735 / 1369 - 2368 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0023 --- Epoch 736 / 1369 - 2369 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0020 --- Epoch 737 / 1369 - 2370 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0020 --- Epoch 738 / 1369 - 2371 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0006 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0080 --- Epoch 739 / 1369 - 2372 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0058 --- Epoch 740 / 1369 - 2373 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0027 --- Epoch 741 / 1369 - 2374 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0091 --- Epoch 742 / 1369 - 2375 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0023 --- Epoch 743 / 1369 - 2376 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0020 --- Epoch 744 / 1369 - 2377 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0158 Iteration 80, loss = 0.0269 --- Epoch 745 / 1369 - 2378 epochs total Iteration 0, 
loss = 0.0064 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0042 --- Epoch 746 / 1369 - 2379 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0153 --- Epoch 747 / 1369 - 2380 epochs total Iteration 0, loss = 0.0167 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0107 --- Epoch 748 / 1369 - 2381 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0123 --- Epoch 749 / 1369 - 2382 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0379 Iteration 80, loss = 0.0011 --- Epoch 750 / 1369 - 2383 epochs total Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0007 --- Epoch 751 / 1369 - 2384 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0027 --- Epoch 752 / 1369 - 2385 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0071 --- Epoch 753 / 1369 - 2386 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0045 --- Epoch 754 / 1369 - 2387 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0059 --- Epoch 755 / 1369 - 2388 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0034 --- Epoch 756 / 1369 - 2389 epochs total Iteration 0, loss = 0.0018 
Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0199 --- Epoch 757 / 1369 - 2390 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0072 --- Epoch 758 / 1369 - 2391 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0012 --- Epoch 759 / 1369 - 2392 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0025 --- Epoch 760 / 1369 - 2393 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0069 --- Epoch 761 / 1369 - 2394 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0005 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0038 --- Epoch 762 / 1369 - 2395 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0011 --- Epoch 763 / 1369 - 2396 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0006 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0019 --- Epoch 764 / 1369 - 2397 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0112 --- Epoch 765 / 1369 - 2398 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0282 Iteration 80, loss = 0.0012 --- Epoch 766 / 1369 - 2399 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0092 --- Epoch 767 / 1369 - 2400 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss 
= 0.0052 Iteration 40, loss = 0.0006 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0021 --- Epoch 768 / 1369 - 2401 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0194 Iteration 80, loss = 0.0025 --- Epoch 769 / 1369 - 2402 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0052 --- Epoch 770 / 1369 - 2403 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0024 --- Epoch 771 / 1369 - 2404 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0014 --- Epoch 772 / 1369 - 2405 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0025 --- Epoch 773 / 1369 - 2406 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0120 --- Epoch 774 / 1369 - 2407 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0045 --- Epoch 775 / 1369 - 2408 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0235 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0055 --- Epoch 776 / 1369 - 2409 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0058 --- Epoch 777 / 1369 - 2410 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0026 --- Epoch 778 / 1369 - 2411 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0018 Iteration 
40, loss = 0.0030 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0085 --- Epoch 779 / 1369 - 2412 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0031 --- Epoch 780 / 1369 - 2413 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0024 --- Epoch 781 / 1369 - 2414 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0027 --- Epoch 782 / 1369 - 2415 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0024 --- Epoch 783 / 1369 - 2416 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0033 --- Epoch 784 / 1369 - 2417 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0010 --- Epoch 785 / 1369 - 2418 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0036 --- Epoch 786 / 1369 - 2419 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0045 --- Epoch 787 / 1369 - 2420 epochs total Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0026 --- Epoch 788 / 1369 - 2421 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0011 --- Epoch 789 / 1369 - 2422 epochs total Iteration 0, loss = 0.0200 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0098 
Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0039 --- Epoch 790 / 1369 - 2423 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0040 --- Epoch 791 / 1369 - 2424 epochs total Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0210 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0027 --- Epoch 792 / 1369 - 2425 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0052 --- Epoch 793 / 1369 - 2426 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0080 --- Epoch 794 / 1369 - 2427 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0080 --- Epoch 795 / 1369 - 2428 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0038 --- Epoch 796 / 1369 - 2429 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0023 --- Epoch 797 / 1369 - 2430 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0022 --- Epoch 798 / 1369 - 2431 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0054 --- Epoch 799 / 1369 - 2432 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0035 --- Epoch 800 / 1369 - 2433 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0057 Iteration 60, loss 
= 0.0057 Iteration 80, loss = 0.0013 --- Epoch 801 / 1369 - 2434 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0008 --- Epoch 802 / 1369 - 2435 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0013 --- Epoch 803 / 1369 - 2436 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0023 --- Epoch 804 / 1369 - 2437 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0136 --- Epoch 805 / 1369 - 2438 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0060 --- Epoch 806 / 1369 - 2439 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0008 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0050 --- Epoch 807 / 1369 - 2440 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0024 --- Epoch 808 / 1369 - 2441 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0050 --- Epoch 809 / 1369 - 2442 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0044 --- Epoch 810 / 1369 - 2443 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0279 Iteration 40, loss = 0.0253 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0037 --- Epoch 811 / 1369 - 2444 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0139 Iteration 
80, loss = 0.0107 --- Epoch 812 / 1369 - 2445 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0279 --- Epoch 813 / 1369 - 2446 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0158 --- Epoch 814 / 1369 - 2447 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0007 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0016 --- Epoch 815 / 1369 - 2448 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0020 --- Epoch 816 / 1369 - 2449 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0098 --- Epoch 817 / 1369 - 2450 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0022 --- Epoch 818 / 1369 - 2451 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0029 --- Epoch 819 / 1369 - 2452 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0050 --- Epoch 820 / 1369 - 2453 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0017 --- Epoch 821 / 1369 - 2454 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0006 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0063 --- Epoch 822 / 1369 - 2455 epochs total Iteration 0, loss = 0.0205 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0021 
--- Epoch 823 / 1369 - 2456 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0181 --- Epoch 824 / 1369 - 2457 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0067 --- Epoch 825 / 1369 - 2458 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0173 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0074 --- Epoch 826 / 1369 - 2459 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0058 --- Epoch 827 / 1369 - 2460 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0005 Iteration 80, loss = 0.0190 --- Epoch 828 / 1369 - 2461 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0020 --- Epoch 829 / 1369 - 2462 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0026 --- Epoch 830 / 1369 - 2463 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0021 --- Epoch 831 / 1369 - 2464 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0120 --- Epoch 832 / 1369 - 2465 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0016 --- Epoch 833 / 1369 - 2466 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0005 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0008 --- Epoch 834 / 
1369 - 2467 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0045 --- Epoch 835 / 1369 - 2468 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0056 --- Epoch 836 / 1369 - 2469 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0042 --- Epoch 837 / 1369 - 2470 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0047 --- Epoch 838 / 1369 - 2471 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0159 --- Epoch 839 / 1369 - 2472 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0042 --- Epoch 840 / 1369 - 2473 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0120 --- Epoch 841 / 1369 - 2474 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0033 --- Epoch 842 / 1369 - 2475 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0010 --- Epoch 843 / 1369 - 2476 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0005 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0023 --- Epoch 844 / 1369 - 2477 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0190 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0051 --- Epoch 845 / 1369 - 2478 epochs 
total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0036 --- Epoch 846 / 1369 - 2479 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0073 --- Epoch 847 / 1369 - 2480 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0074 --- Epoch 848 / 1369 - 2481 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0066 --- Epoch 849 / 1369 - 2482 epochs total Iteration 0, loss = 0.0253 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0082 --- Epoch 850 / 1369 - 2483 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0021 --- Epoch 851 / 1369 - 2484 epochs total Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0007 --- Epoch 852 / 1369 - 2485 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0028 --- Epoch 853 / 1369 - 2486 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0007 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0055 --- Epoch 854 / 1369 - 2487 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0046 --- Epoch 855 / 1369 - 2488 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0005 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0060 --- Epoch 856 / 1369 - 2489 epochs total Iteration 0, 
loss = 0.0223 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0017 --- Epoch 857 / 1369 - 2490 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0219 --- Epoch 858 / 1369 - 2491 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0146 --- Epoch 859 / 1369 - 2492 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0014 --- Epoch 860 / 1369 - 2493 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0012 --- Epoch 861 / 1369 - 2494 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0280 --- Epoch 862 / 1369 - 2495 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0016 --- Epoch 863 / 1369 - 2496 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0020 --- Epoch 864 / 1369 - 2497 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0032 --- Epoch 865 / 1369 - 2498 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0034 --- Epoch 866 / 1369 - 2499 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0036 --- Epoch 867 / 1369 - 2500 epochs total Iteration 0, loss = 0.0133 
Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0400 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0047 --- Epoch 868 / 1369 - 2501 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0500 --- Epoch 869 / 1369 - 2502 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0020 --- Epoch 870 / 1369 - 2503 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0020 --- Epoch 871 / 1369 - 2504 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0122 --- Epoch 872 / 1369 - 2505 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0035 --- Epoch 873 / 1369 - 2506 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0007 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0012 --- Epoch 874 / 1369 - 2507 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0078 --- Epoch 875 / 1369 - 2508 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0007 --- Epoch 876 / 1369 - 2509 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0022 --- Epoch 877 / 1369 - 2510 epochs total Iteration 0, loss = 0.0190 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0014 --- Epoch 878 / 1369 - 2511 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss 
= 0.0039 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0059 --- Epoch 879 / 1369 - 2512 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0059 --- Epoch 880 / 1369 - 2513 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0170 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0022 --- Epoch 881 / 1369 - 2514 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0019 --- Epoch 882 / 1369 - 2515 epochs total Iteration 0, loss = 0.0008 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0049 --- Epoch 883 / 1369 - 2516 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0121 --- Epoch 884 / 1369 - 2517 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0027 --- Epoch 885 / 1369 - 2518 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0015 --- Epoch 886 / 1369 - 2519 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0049 --- Epoch 887 / 1369 - 2520 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0013 --- Epoch 888 / 1369 - 2521 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0101 --- Epoch 889 / 1369 - 2522 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0018 Iteration 
40, loss = 0.0035 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0020 --- Epoch 890 / 1369 - 2523 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0059 --- Epoch 891 / 1369 - 2524 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0029 --- Epoch 892 / 1369 - 2525 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0018 --- Epoch 893 / 1369 - 2526 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0027 --- Epoch 894 / 1369 - 2527 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0039 --- Epoch 895 / 1369 - 2528 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0184 Iteration 80, loss = 0.0059 --- Epoch 896 / 1369 - 2529 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0035 --- Epoch 897 / 1369 - 2530 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0010 --- Epoch 898 / 1369 - 2531 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0013 --- Epoch 899 / 1369 - 2532 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0375 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0005 --- Epoch 900 / 1369 - 2533 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0119 
Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0031 --- Epoch 901 / 1369 - 2534 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0013 --- Epoch 902 / 1369 - 2535 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0135 --- Epoch 903 / 1369 - 2536 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0083 --- Epoch 904 / 1369 - 2537 epochs total Iteration 0, loss = 0.0226 Iteration 20, loss = 0.0410 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0121 --- Epoch 905 / 1369 - 2538 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0453 Iteration 80, loss = 0.0031 --- Epoch 906 / 1369 - 2539 epochs total Iteration 0, loss = 0.0310 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0033 --- Epoch 907 / 1369 - 2540 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0048 --- Epoch 908 / 1369 - 2541 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0017 --- Epoch 909 / 1369 - 2542 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0021 --- Epoch 910 / 1369 - 2543 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0127 --- Epoch 911 / 1369 - 2544 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0047 Iteration 60, loss 
= 0.0049 Iteration 80, loss = 0.0029 --- Epoch 912 / 1369 - 2545 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0005 --- Epoch 913 / 1369 - 2546 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0014 --- Epoch 914 / 1369 - 2547 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0006 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0058 --- Epoch 915 / 1369 - 2548 epochs total Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0044 --- Epoch 916 / 1369 - 2549 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0025 --- Epoch 917 / 1369 - 2550 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0119 --- Epoch 918 / 1369 - 2551 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0043 --- Epoch 919 / 1369 - 2552 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0073 --- Epoch 920 / 1369 - 2553 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0028 --- Epoch 921 / 1369 - 2554 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0256 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0014 --- Epoch 922 / 1369 - 2555 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0045 Iteration 
80, loss = 0.0048 --- Epoch 923 / 1369 - 2556 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0046 --- Epoch 924 / 1369 - 2557 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0027 --- Epoch 925 / 1369 - 2558 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0025 --- Epoch 926 / 1369 - 2559 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0064 --- Epoch 927 / 1369 - 2560 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0048 --- Epoch 928 / 1369 - 2561 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0012 --- Epoch 929 / 1369 - 2562 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0023 --- Epoch 930 / 1369 - 2563 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0029 --- Epoch 931 / 1369 - 2564 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0051 --- Epoch 932 / 1369 - 2565 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0143 --- Epoch 933 / 1369 - 2566 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0034 
--- Epoch 934 / 1369 - 2567 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0378 Iteration 80, loss = 0.0055 --- Epoch 935 / 1369 - 2568 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0024 --- Epoch 936 / 1369 - 2569 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0157 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0024 --- Epoch 937 / 1369 - 2570 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0075 --- Epoch 938 / 1369 - 2571 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0036 --- Epoch 939 / 1369 - 2572 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0165 Iteration 80, loss = 0.0115 --- Epoch 940 / 1369 - 2573 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0032 --- Epoch 941 / 1369 - 2574 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0083 --- Epoch 942 / 1369 - 2575 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0222 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0036 --- Epoch 943 / 1369 - 2576 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0015 --- Epoch 944 / 1369 - 2577 epochs total Iteration 0, loss = 0.0181 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0016 --- Epoch 945 / 
1369 - 2578 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0018 --- Epoch 946 / 1369 - 2579 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0077 --- Epoch 947 / 1369 - 2580 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0093 --- Epoch 948 / 1369 - 2581 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0008 --- Epoch 949 / 1369 - 2582 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0094 --- Epoch 950 / 1369 - 2583 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0033 --- Epoch 951 / 1369 - 2584 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0128 --- Epoch 952 / 1369 - 2585 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0021 --- Epoch 953 / 1369 - 2586 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0015 --- Epoch 954 / 1369 - 2587 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0026 --- Epoch 955 / 1369 - 2588 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0333 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0121 --- Epoch 956 / 1369 - 2589 epochs 
total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0111 --- Epoch 957 / 1369 - 2590 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0070 --- Epoch 958 / 1369 - 2591 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0084 --- Epoch 959 / 1369 - 2592 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0011 --- Epoch 960 / 1369 - 2593 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0062 --- Epoch 961 / 1369 - 2594 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0004 Iteration 80, loss = 0.0038 --- Epoch 962 / 1369 - 2595 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0075 --- Epoch 963 / 1369 - 2596 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0041 --- Epoch 964 / 1369 - 2597 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0061 --- Epoch 965 / 1369 - 2598 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0025 --- Epoch 966 / 1369 - 2599 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0063 --- Epoch 967 / 1369 - 2600 epochs total Iteration 0, 
loss = 0.0055 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0096 --- Epoch 968 / 1369 - 2601 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0020 --- Epoch 969 / 1369 - 2602 epochs total Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0007 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0185 --- Epoch 970 / 1369 - 2603 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0013 --- Epoch 971 / 1369 - 2604 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0040 --- Epoch 972 / 1369 - 2605 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0070 --- Epoch 973 / 1369 - 2606 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0032 --- Epoch 974 / 1369 - 2607 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0022 --- Epoch 975 / 1369 - 2608 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0018 --- Epoch 976 / 1369 - 2609 epochs total Iteration 0, loss = 0.0300 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0035 --- Epoch 977 / 1369 - 2610 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0094 --- Epoch 978 / 1369 - 2611 epochs total Iteration 0, loss = 0.0006 
Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0021 --- Epoch 979 / 1369 - 2612 epochs total Iteration 0, loss = 0.0007 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0007 --- Epoch 980 / 1369 - 2613 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0062 --- Epoch 981 / 1369 - 2614 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0008 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0242 --- Epoch 982 / 1369 - 2615 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0050 --- Epoch 983 / 1369 - 2616 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0026 --- Epoch 984 / 1369 - 2617 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0042 --- Epoch 985 / 1369 - 2618 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0031 --- Epoch 986 / 1369 - 2619 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0061 --- Epoch 987 / 1369 - 2620 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0202 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0030 --- Epoch 988 / 1369 - 2621 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0053 --- Epoch 989 / 1369 - 2622 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss 
= 0.0043 Iteration 40, loss = 0.0007 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0014 --- Epoch 990 / 1369 - 2623 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0030 --- Epoch 991 / 1369 - 2624 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0206 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0026 --- Epoch 992 / 1369 - 2625 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0016 --- Epoch 993 / 1369 - 2626 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0059 --- Epoch 994 / 1369 - 2627 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0009 --- Epoch 995 / 1369 - 2628 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0036 --- Epoch 996 / 1369 - 2629 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0014 --- Epoch 997 / 1369 - 2630 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0070 --- Epoch 998 / 1369 - 2631 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0042 --- Epoch 999 / 1369 - 2632 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0035 --- Epoch 1000 / 1369 - 2633 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0142 Iteration 
40, loss = 0.0019 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0062 --- Epoch 1001 / 1369 - 2634 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0210 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0010 --- Epoch 1002 / 1369 - 2635 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0028 --- Epoch 1003 / 1369 - 2636 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0035 --- Epoch 1004 / 1369 - 2637 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0020 --- Epoch 1005 / 1369 - 2638 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0076 --- Epoch 1006 / 1369 - 2639 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0186 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0020 --- Epoch 1007 / 1369 - 2640 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0099 --- Epoch 1008 / 1369 - 2641 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0280 Iteration 80, loss = 0.0097 --- Epoch 1009 / 1369 - 2642 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0082 --- Epoch 1010 / 1369 - 2643 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0311 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0029 --- Epoch 1011 / 1369 - 2644 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0014 Iteration 40, loss 
= 0.0071 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0030 --- Epoch 1012 / 1369 - 2645 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0025 --- Epoch 1013 / 1369 - 2646 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0022 --- Epoch 1014 / 1369 - 2647 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0030 --- Epoch 1015 / 1369 - 2648 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0249 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0037 --- Epoch 1016 / 1369 - 2649 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0057 --- Epoch 1017 / 1369 - 2650 epochs total Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0007 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0281 Iteration 80, loss = 0.0023 --- Epoch 1018 / 1369 - 2651 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0040 --- Epoch 1019 / 1369 - 2652 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0021 --- Epoch 1020 / 1369 - 2653 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0038 --- Epoch 1021 / 1369 - 2654 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0042 --- Epoch 1022 / 1369 - 2655 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0132 
Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0012 --- Epoch 1023 / 1369 - 2656 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0032 --- Epoch 1024 / 1369 - 2657 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0072 --- Epoch 1025 / 1369 - 2658 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0235 --- Epoch 1026 / 1369 - 2659 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0055 --- Epoch 1027 / 1369 - 2660 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0060 --- Epoch 1028 / 1369 - 2661 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0005 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0060 --- Epoch 1029 / 1369 - 2662 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0024 --- Epoch 1030 / 1369 - 2663 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0039 --- Epoch 1031 / 1369 - 2664 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0240 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0132 --- Epoch 1032 / 1369 - 2665 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0174 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0016 --- Epoch 1033 / 1369 - 2666 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0061 
Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0018 --- Epoch 1034 / 1369 - 2667 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0021 --- Epoch 1035 / 1369 - 2668 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0057 --- Epoch 1036 / 1369 - 2669 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0107 --- Epoch 1037 / 1369 - 2670 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0037 --- Epoch 1038 / 1369 - 2671 epochs total Iteration 0, loss = 0.0189 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0043 --- Epoch 1039 / 1369 - 2672 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0007 --- Epoch 1040 / 1369 - 2673 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0023 --- Epoch 1041 / 1369 - 2674 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0028 --- Epoch 1042 / 1369 - 2675 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0080 --- Epoch 1043 / 1369 - 2676 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0096 --- Epoch 1044 / 1369 - 2677 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0087 
Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0037 --- Epoch 1045 / 1369 - 2678 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0025 --- Epoch 1046 / 1369 - 2679 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0029 --- Epoch 1047 / 1369 - 2680 epochs total Iteration 0, loss = 0.0007 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0037 --- Epoch 1048 / 1369 - 2681 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0037 --- Epoch 1049 / 1369 - 2682 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0019 --- Epoch 1050 / 1369 - 2683 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0070 --- Epoch 1051 / 1369 - 2684 epochs total Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0015 --- Epoch 1052 / 1369 - 2685 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0021 --- Epoch 1053 / 1369 - 2686 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0212 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0021 --- Epoch 1054 / 1369 - 2687 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0029 --- Epoch 1055 / 1369 - 2688 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0025 
Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0017 --- Epoch 1056 / 1369 - 2689 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0115 --- Epoch 1057 / 1369 - 2690 epochs total Iteration 0, loss = 0.0284 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0085 --- Epoch 1058 / 1369 - 2691 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0011 --- Epoch 1059 / 1369 - 2692 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0026 --- Epoch 1060 / 1369 - 2693 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0035 --- Epoch 1061 / 1369 - 2694 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0029 --- Epoch 1062 / 1369 - 2695 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0027 --- Epoch 1063 / 1369 - 2696 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0102 --- Epoch 1064 / 1369 - 2697 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0173 --- Epoch 1065 / 1369 - 2698 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0284 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0098 --- Epoch 1066 / 1369 - 2699 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0022 
Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0043 --- Epoch 1067 / 1369 - 2700 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0028 --- Epoch 1068 / 1369 - 2701 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0018 --- Epoch 1069 / 1369 - 2702 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0079 --- Epoch 1070 / 1369 - 2703 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0041 --- Epoch 1071 / 1369 - 2704 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0019 --- Epoch 1072 / 1369 - 2705 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0006 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0192 --- Epoch 1073 / 1369 - 2706 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0138 --- Epoch 1074 / 1369 - 2707 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0059 --- Epoch 1075 / 1369 - 2708 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0100 --- Epoch 1076 / 1369 - 2709 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0045 --- Epoch 1077 / 1369 - 2710 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0119 
Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0024 --- Epoch 1078 / 1369 - 2711 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0095 --- Epoch 1079 / 1369 - 2712 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0027 --- Epoch 1080 / 1369 - 2713 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0235 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0025 --- Epoch 1081 / 1369 - 2714 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0046 --- Epoch 1082 / 1369 - 2715 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0019 --- Epoch 1083 / 1369 - 2716 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0045 --- Epoch 1084 / 1369 - 2717 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0497 --- Epoch 1085 / 1369 - 2718 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0016 --- Epoch 1086 / 1369 - 2719 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0118 --- Epoch 1087 / 1369 - 2720 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0017 --- Epoch 1088 / 1369 - 2721 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0013 
Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0041 --- Epoch 1089 / 1369 - 2722 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0028 --- Epoch 1090 / 1369 - 2723 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0026 --- Epoch 1091 / 1369 - 2724 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0130 --- Epoch 1092 / 1369 - 2725 epochs total Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0011 --- Epoch 1093 / 1369 - 2726 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0083 --- Epoch 1094 / 1369 - 2727 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0125 --- Epoch 1095 / 1369 - 2728 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0114 --- Epoch 1096 / 1369 - 2729 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0033 --- Epoch 1097 / 1369 - 2730 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0053 --- Epoch 1098 / 1369 - 2731 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0022 --- Epoch 1099 / 1369 - 2732 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0030 
Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0116 --- Epoch 1100 / 1369 - 2733 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0028 --- Epoch 1101 / 1369 - 2734 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0025 --- Epoch 1102 / 1369 - 2735 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0026 --- Epoch 1103 / 1369 - 2736 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0013 --- Epoch 1104 / 1369 - 2737 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0016 --- Epoch 1105 / 1369 - 2738 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0175 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0148 --- Epoch 1106 / 1369 - 2739 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0378 Iteration 80, loss = 0.0023 --- Epoch 1107 / 1369 - 2740 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0038 --- Epoch 1108 / 1369 - 2741 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0039 --- Epoch 1109 / 1369 - 2742 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0007 --- Epoch 1110 / 1369 - 2743 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0015 
Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0005 --- Epoch 1111 / 1369 - 2744 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0010 --- Epoch 1112 / 1369 - 2745 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0159 --- Epoch 1113 / 1369 - 2746 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0018 --- Epoch 1114 / 1369 - 2747 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0088 --- Epoch 1115 / 1369 - 2748 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0032 --- Epoch 1116 / 1369 - 2749 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0098 --- Epoch 1117 / 1369 - 2750 epochs total Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0008 --- Epoch 1118 / 1369 - 2751 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0023 --- Epoch 1119 / 1369 - 2752 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0094 --- Epoch 1120 / 1369 - 2753 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0282 Iteration 80, loss = 0.0012 --- Epoch 1121 / 1369 - 2754 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0104 
Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0103 --- Epoch 1122 / 1369 - 2755 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0023 --- Epoch 1123 / 1369 - 2756 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0040 --- Epoch 1124 / 1369 - 2757 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0039 --- Epoch 1125 / 1369 - 2758 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0035 --- Epoch 1126 / 1369 - 2759 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0044 --- Epoch 1127 / 1369 - 2760 epochs total Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0051 --- Epoch 1128 / 1369 - 2761 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0070 --- Epoch 1129 / 1369 - 2762 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0091 --- Epoch 1130 / 1369 - 2763 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0079 --- Epoch 1131 / 1369 - 2764 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0045 --- Epoch 1132 / 1369 - 2765 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0031 
Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0068 --- Epoch 1133 / 1369 - 2766 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0186 --- Epoch 1134 / 1369 - 2767 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0052 --- Epoch 1135 / 1369 - 2768 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0019 --- Epoch 1136 / 1369 - 2769 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0168 --- Epoch 1137 / 1369 - 2770 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0135 --- Epoch 1138 / 1369 - 2771 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0031 --- Epoch 1139 / 1369 - 2772 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0016 --- Epoch 1140 / 1369 - 2773 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0029 --- Epoch 1141 / 1369 - 2774 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0023 --- Epoch 1142 / 1369 - 2775 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0007 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0049 --- Epoch 1143 / 1369 - 2776 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0030 
Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0006 --- Epoch 1144 / 1369 - 2777 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0113 --- Epoch 1145 / 1369 - 2778 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0071 --- Epoch 1146 / 1369 - 2779 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0050 --- Epoch 1147 / 1369 - 2780 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0042 --- Epoch 1148 / 1369 - 2781 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0131 --- Epoch 1149 / 1369 - 2782 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0018 --- Epoch 1150 / 1369 - 2783 epochs total Iteration 0, loss = 0.0157 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0032 --- Epoch 1151 / 1369 - 2784 epochs total Iteration 0, loss = 0.0218 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0063 --- Epoch 1152 / 1369 - 2785 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0149 --- Epoch 1153 / 1369 - 2786 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0028 --- Epoch 1154 / 1369 - 2787 epochs total Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0023 
Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0104 --- Epoch 1155 / 1369 - 2788 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0029 --- Epoch 1156 / 1369 - 2789 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0042 --- Epoch 1157 / 1369 - 2790 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0051 --- Epoch 1158 / 1369 - 2791 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0041 --- Epoch 1159 / 1369 - 2792 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0023 --- Epoch 1160 / 1369 - 2793 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0025 --- Epoch 1161 / 1369 - 2794 epochs total Iteration 0, loss = 0.0292 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0015 --- Epoch 1162 / 1369 - 2795 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0067 --- Epoch 1163 / 1369 - 2796 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0202 --- Epoch 1164 / 1369 - 2797 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0093 --- Epoch 1165 / 1369 - 2798 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0021 
Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0028 --- Epoch 1166 / 1369 - 2799 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0023 --- Epoch 1167 / 1369 - 2800 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0012 --- Epoch 1168 / 1369 - 2801 epochs total Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0012 --- Epoch 1169 / 1369 - 2802 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0103 --- Epoch 1170 / 1369 - 2803 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0034 --- Epoch 1171 / 1369 - 2804 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0018 --- Epoch 1172 / 1369 - 2805 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0030 --- Epoch 1173 / 1369 - 2806 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0014 --- Epoch 1174 / 1369 - 2807 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0190 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0058 --- Epoch 1175 / 1369 - 2808 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0082 --- Epoch 1176 / 1369 - 2809 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0009 
Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0027 --- Epoch 1177 / 1369 - 2810 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0190 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0025 --- Epoch 1178 / 1369 - 2811 epochs total Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0043 --- Epoch 1179 / 1369 - 2812 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0012 --- Epoch 1180 / 1369 - 2813 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0107 --- Epoch 1181 / 1369 - 2814 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0023 --- Epoch 1182 / 1369 - 2815 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0128 --- Epoch 1183 / 1369 - 2816 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0156 --- Epoch 1184 / 1369 - 2817 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0015 --- Epoch 1185 / 1369 - 2818 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0008 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0035 --- Epoch 1186 / 1369 - 2819 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0037 --- Epoch 1187 / 1369 - 2820 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0026 
Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0039 --- Epoch 1188 / 1369 - 2821 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0099 --- Epoch 1189 / 1369 - 2822 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0032 --- Epoch 1190 / 1369 - 2823 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0015 --- Epoch 1191 / 1369 - 2824 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0085 --- Epoch 1192 / 1369 - 2825 epochs total Iteration 0, loss = 0.0137 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0008 --- Epoch 1193 / 1369 - 2826 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0014 --- Epoch 1194 / 1369 - 2827 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0056 --- Epoch 1195 / 1369 - 2828 epochs total Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0051 --- Epoch 1196 / 1369 - 2829 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0172 --- Epoch 1197 / 1369 - 2830 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0028 --- Epoch 1198 / 1369 - 2831 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0029 
Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0029 --- Epoch 1199 / 1369 - 2832 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0038 --- Epoch 1200 / 1369 - 2833 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0057 --- Epoch 1201 / 1369 - 2834 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0065 --- Epoch 1202 / 1369 - 2835 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0019 --- Epoch 1203 / 1369 - 2836 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0020 --- Epoch 1204 / 1369 - 2837 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0153 --- Epoch 1205 / 1369 - 2838 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0019 --- Epoch 1206 / 1369 - 2839 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0061 --- Epoch 1207 / 1369 - 2840 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0311 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0025 --- Epoch 1208 / 1369 - 2841 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0036 --- Epoch 1209 / 1369 - 2842 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0052 
Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0063 --- Epoch 1210 / 1369 - 2843 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0050 --- Epoch 1211 / 1369 - 2844 epochs total Iteration 0, loss = 0.0294 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0039 --- Epoch 1212 / 1369 - 2845 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0069 --- Epoch 1213 / 1369 - 2846 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0005 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0030 --- Epoch 1214 / 1369 - 2847 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0021 --- Epoch 1215 / 1369 - 2848 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0227 --- Epoch 1216 / 1369 - 2849 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0319 --- Epoch 1217 / 1369 - 2850 epochs total Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0058 --- Epoch 1218 / 1369 - 2851 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0064 --- Epoch 1219 / 1369 - 2852 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0192 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0018 --- Epoch 1220 / 1369 - 2853 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0107 
Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0022 --- Epoch 1221 / 1369 - 2854 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0023 --- Epoch 1222 / 1369 - 2855 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0096 --- Epoch 1223 / 1369 - 2856 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0192 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0018 --- Epoch 1224 / 1369 - 2857 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0005 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0031 --- Epoch 1225 / 1369 - 2858 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0081 --- Epoch 1226 / 1369 - 2859 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0039 --- Epoch 1227 / 1369 - 2860 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0006 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0076 --- Epoch 1228 / 1369 - 2861 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0020 --- Epoch 1229 / 1369 - 2862 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0054 --- Epoch 1230 / 1369 - 2863 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0069 --- Epoch 1231 / 1369 - 2864 epochs total Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0033 
Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0020 --- Epoch 1232 / 1369 - 2865 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0138 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0055 --- Epoch 1233 / 1369 - 2866 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0025 --- Epoch 1234 / 1369 - 2867 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0041 --- Epoch 1235 / 1369 - 2868 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0023 --- Epoch 1236 / 1369 - 2869 epochs total Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0016 --- Epoch 1237 / 1369 - 2870 epochs total Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0063 --- Epoch 1238 / 1369 - 2871 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0122 --- Epoch 1239 / 1369 - 2872 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0090 --- Epoch 1240 / 1369 - 2873 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0022 --- Epoch 1241 / 1369 - 2874 epochs total Iteration 0, loss = 0.0375 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0055 --- Epoch 1242 / 1369 - 2875 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0019 
Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0047 --- Epoch 1243 / 1369 - 2876 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0099 --- Epoch 1244 / 1369 - 2877 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0025 --- Epoch 1245 / 1369 - 2878 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0178 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0040 --- Epoch 1246 / 1369 - 2879 epochs total Iteration 0, loss = 0.0252 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0043 --- Epoch 1247 / 1369 - 2880 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0016 --- Epoch 1248 / 1369 - 2881 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0023 --- Epoch 1249 / 1369 - 2882 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0068 --- Epoch 1250 / 1369 - 2883 epochs total Iteration 0, loss = 0.0171 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0039 --- Epoch 1251 / 1369 - 2884 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0012 --- Epoch 1252 / 1369 - 2885 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0022 --- Epoch 1253 / 1369 - 2886 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0055 
Iteration 60, loss = 0.0250 Iteration 80, loss = 0.0081 --- Epoch 1254 / 1369 - 2887 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0039 --- Epoch 1255 / 1369 - 2888 epochs total Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0077 --- Epoch 1256 / 1369 - 2889 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0015 --- Epoch 1257 / 1369 - 2890 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0024 --- Epoch 1258 / 1369 - 2891 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0009 --- Epoch 1259 / 1369 - 2892 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0024 --- Epoch 1260 / 1369 - 2893 epochs total Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0108 --- Epoch 1261 / 1369 - 2894 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0023 --- Epoch 1262 / 1369 - 2895 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0052 --- Epoch 1263 / 1369 - 2896 epochs total Iteration 0, loss = 0.0005 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0057 --- Epoch 1264 / 1369 - 2897 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0034 
Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0023 --- Epoch 1265 / 1369 - 2898 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0264 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0028 --- Epoch 1266 / 1369 - 2899 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0034 --- Epoch 1267 / 1369 - 2900 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0034 --- Epoch 1268 / 1369 - 2901 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0056 --- Epoch 1269 / 1369 - 2902 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0031 --- Epoch 1270 / 1369 - 2903 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0095 --- Epoch 1271 / 1369 - 2904 epochs total Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0005 Iteration 80, loss = 0.0009 --- Epoch 1272 / 1369 - 2905 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0058 --- Epoch 1273 / 1369 - 2906 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0093 --- Epoch 1274 / 1369 - 2907 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0102 --- Epoch 1275 / 1369 - 2908 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0042 
Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0031 --- Epoch 1276 / 1369 - 2909 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0026 --- Epoch 1277 / 1369 - 2910 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0100 --- Epoch 1278 / 1369 - 2911 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0041 --- Epoch 1279 / 1369 - 2912 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0138 --- Epoch 1280 / 1369 - 2913 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0022 --- Epoch 1281 / 1369 - 2914 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0015 --- Epoch 1282 / 1369 - 2915 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0050 --- Epoch 1283 / 1369 - 2916 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0023 --- Epoch 1284 / 1369 - 2917 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0012 --- Epoch 1285 / 1369 - 2918 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0156 --- Epoch 1286 / 1369 - 2919 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0026 
Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0049 --- Epoch 1287 / 1369 - 2920 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0375 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0017 --- Epoch 1288 / 1369 - 2921 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0035 --- Epoch 1289 / 1369 - 2922 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0024 --- Epoch 1290 / 1369 - 2923 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0040 --- Epoch 1291 / 1369 - 2924 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0044 --- Epoch 1292 / 1369 - 2925 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0024 --- Epoch 1293 / 1369 - 2926 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0024 --- Epoch 1294 / 1369 - 2927 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0033 --- Epoch 1295 / 1369 - 2928 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0131 --- Epoch 1296 / 1369 - 2929 epochs total Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0015 --- Epoch 1297 / 1369 - 2930 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0033 
Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0037 --- Epoch 1298 / 1369 - 2931 epochs total Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0053 --- Epoch 1299 / 1369 - 2932 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0170 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0087 --- Epoch 1300 / 1369 - 2933 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0132 --- Epoch 1301 / 1369 - 2934 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0021 --- Epoch 1302 / 1369 - 2935 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0059 --- Epoch 1303 / 1369 - 2936 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0041 --- Epoch 1304 / 1369 - 2937 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0051 --- Epoch 1305 / 1369 - 2938 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0025 --- Epoch 1306 / 1369 - 2939 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0033 --- Epoch 1307 / 1369 - 2940 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0056 --- Epoch 1308 / 1369 - 2941 epochs total Iteration 0, loss = 0.0013 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0058 
Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0029 --- Epoch 1309 / 1369 - 2942 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0410 Iteration 80, loss = 0.0018 --- Epoch 1310 / 1369 - 2943 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0051 --- Epoch 1311 / 1369 - 2944 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0022 --- Epoch 1312 / 1369 - 2945 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0041 --- Epoch 1313 / 1369 - 2946 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0030 --- Epoch 1314 / 1369 - 2947 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0012 --- Epoch 1315 / 1369 - 2948 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0019 --- Epoch 1316 / 1369 - 2949 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0125 Iteration 80, loss = 0.0093 --- Epoch 1317 / 1369 - 2950 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0028 --- Epoch 1318 / 1369 - 2951 epochs total Iteration 0, loss = 0.0208 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0012 --- Epoch 1319 / 1369 - 2952 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0069 
Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0016 --- Epoch 1320 / 1369 - 2953 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0071 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0014 --- Epoch 1321 / 1369 - 2954 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0029 --- Epoch 1322 / 1369 - 2955 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0031 --- Epoch 1323 / 1369 - 2956 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0069 --- Epoch 1324 / 1369 - 2957 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0070 --- Epoch 1325 / 1369 - 2958 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0183 --- Epoch 1326 / 1369 - 2959 epochs total Iteration 0, loss = 0.0007 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0064 --- Epoch 1327 / 1369 - 2960 epochs total Iteration 0, loss = 0.0145 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0034 --- Epoch 1328 / 1369 - 2961 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0280 --- Epoch 1329 / 1369 - 2962 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0025 --- Epoch 1330 / 1369 - 2963 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0061 
Iteration 60, loss = 0.0508 Iteration 80, loss = 0.0051 --- Epoch 1331 / 1369 - 2964 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0011 --- Epoch 1332 / 1369 - 2965 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0020 --- Epoch 1333 / 1369 - 2966 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0049 --- Epoch 1334 / 1369 - 2967 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0018 --- Epoch 1335 / 1369 - 2968 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0031 --- Epoch 1336 / 1369 - 2969 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0026 --- Epoch 1337 / 1369 - 2970 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0010 Iteration 80, loss = 0.0015 --- Epoch 1338 / 1369 - 2971 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0059 --- Epoch 1339 / 1369 - 2972 epochs total Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0013 --- Epoch 1340 / 1369 - 2973 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0022 --- Epoch 1341 / 1369 - 2974 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0033 
Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0012 --- Epoch 1342 / 1369 - 2975 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0081 --- Epoch 1343 / 1369 - 2976 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0157 --- Epoch 1344 / 1369 - 2977 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0038 --- Epoch 1345 / 1369 - 2978 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0013 --- Epoch 1346 / 1369 - 2979 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0102 --- Epoch 1347 / 1369 - 2980 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0057 --- Epoch 1348 / 1369 - 2981 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0195 --- Epoch 1349 / 1369 - 2982 epochs total Iteration 0, loss = 0.0009 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0050 --- Epoch 1350 / 1369 - 2983 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0132 --- Epoch 1351 / 1369 - 2984 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0033 --- Epoch 1352 / 1369 - 2985 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0015 
Iteration 60, loss = 0.0188 Iteration 80, loss = 0.0028 --- Epoch 1353 / 1369 - 2986 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0030 --- Epoch 1354 / 1369 - 2987 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0062 --- Epoch 1355 / 1369 - 2988 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0005 Iteration 80, loss = 0.0044 --- Epoch 1356 / 1369 - 2989 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0067 --- Epoch 1357 / 1369 - 2990 epochs total Iteration 0, loss = 0.0173 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0011 --- Epoch 1358 / 1369 - 2991 epochs total Iteration 0, loss = 0.0151 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0026 --- Epoch 1359 / 1369 - 2992 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0414 Iteration 80, loss = 0.0047 --- Epoch 1360 / 1369 - 2993 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0156 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0104 --- Epoch 1361 / 1369 - 2994 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0033 --- Epoch 1362 / 1369 - 2995 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0016 --- Epoch 1363 / 1369 - 2996 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0090 
Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0121 --- Epoch 1364 / 1369 - 2997 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0033 --- Epoch 1365 / 1369 - 2998 epochs total Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0107 --- Epoch 1366 / 1369 - 2999 epochs total Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0081 --- Epoch 1367 / 1369 - 3000 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0154 Iteration 80, loss = 0.0058 --- Epoch 1368 / 1369 - 3001 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0190 Iteration 80, loss = 0.0012 --- Epoch 1369 / 1369 - 3002 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0021
# Run the notebook's testModel helper for model13 against the
# "X_test_truck" / "y_test_truck" entries of `data`, scoring with MSE.
# NOTE(review): presumably these keys hold a truck-only test subset built
# in an earlier cell -- confirm against where they are populated.
testModel(
    model13,
    x_test=data["X_test_truck"],
    y_test=data["y_test_truck"],
    criterion=nn.MSELoss(),
)
# Experiment 14: a freshly constructed ConvNet4 optimised with plain SGD.
learning_rate = 1e-2
model14 = ConvNet4()
optimizer = optim.SGD(model14.parameters(), lr=learning_rate)

# Inputs are the grayscale-converted images (data["X_train"]) and targets are
# the original colour images (data["y_train"]); the loss is mean-squared error.
# NOTE(review): epochs=100000 looks like "run until manually interrupted"
# rather than a real budget -- confirm that is the intent.
train(
    model14,
    optimizer,
    epochs=100000,
    x_train=data["X_train"],
    y_train=data["y_train"],
    criterion=nn.MSELoss(),
)
--- Epoch 1 / 100000 - 2449 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0238 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0043 --- Epoch 2 / 100000 - 2450 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0032 --- Epoch 3 / 100000 - 2451 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0462 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0043 --- Epoch 4 / 100000 - 2452 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0051 --- Epoch 5 / 100000 - 2453 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0027 --- Epoch 6 / 100000 - 2454 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0065 --- Epoch 7 / 100000 - 2455 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0129 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0023 --- Epoch 8 / 100000 - 2456 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0051 --- Epoch 9 / 100000 - 2457 epochs total Iteration 0, loss = 0.0193 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0173 --- Epoch 10 / 100000 - 2458 epochs total Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0032 --- Epoch 11 / 100000 - 2459 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0248 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0337 --- Epoch 12 / 
100000 - 2460 epochs total Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0380 --- Epoch 13 / 100000 - 2461 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0108 --- Epoch 14 / 100000 - 2462 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0037 --- Epoch 15 / 100000 - 2463 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0193 Iteration 60, loss = 0.0126 Iteration 80, loss = 0.0161 --- Epoch 16 / 100000 - 2464 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0331 Iteration 80, loss = 0.0037 --- Epoch 17 / 100000 - 2465 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0191 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0052 --- Epoch 18 / 100000 - 2466 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0207 --- Epoch 19 / 100000 - 2467 epochs total Iteration 0, loss = 0.0358 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0040 --- Epoch 20 / 100000 - 2468 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0138 --- Epoch 21 / 100000 - 2469 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0265 Iteration 80, loss = 0.0090 --- Epoch 22 / 100000 - 2470 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0025 --- Epoch 23 / 100000 - 
2471 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0334 --- Epoch 24 / 100000 - 2472 epochs total Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0040 --- Epoch 25 / 100000 - 2473 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0064 --- Epoch 26 / 100000 - 2474 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0032 --- Epoch 27 / 100000 - 2475 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0144 --- Epoch 28 / 100000 - 2476 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0090 --- Epoch 29 / 100000 - 2477 epochs total Iteration 0, loss = 0.0334 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0272 Iteration 80, loss = 0.0018 --- Epoch 30 / 100000 - 2478 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0050 --- Epoch 31 / 100000 - 2479 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0120 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0134 --- Epoch 32 / 100000 - 2480 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0033 --- Epoch 33 / 100000 - 2481 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0357 Iteration 40, loss = 0.0198 Iteration 60, loss = 0.0373 Iteration 80, loss = 0.0118 --- Epoch 34 / 100000 - 2482 
epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0309 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0014 --- Epoch 35 / 100000 - 2483 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0043 --- Epoch 36 / 100000 - 2484 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0195 Iteration 80, loss = 0.0019 --- Epoch 37 / 100000 - 2485 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0031 --- Epoch 38 / 100000 - 2486 epochs total Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0075 --- Epoch 39 / 100000 - 2487 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0202 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0107 --- Epoch 40 / 100000 - 2488 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0103 --- Epoch 41 / 100000 - 2489 epochs total Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0050 --- Epoch 42 / 100000 - 2490 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0135 --- Epoch 43 / 100000 - 2491 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0116 Iteration 80, loss = 0.0367 --- Epoch 44 / 100000 - 2492 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0039 --- Epoch 45 / 100000 - 2493 epochs 
total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0342 Iteration 80, loss = 0.0319 --- Epoch 46 / 100000 - 2494 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0048 --- Epoch 47 / 100000 - 2495 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0291 Iteration 80, loss = 0.0039 --- Epoch 48 / 100000 - 2496 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0220 Iteration 60, loss = 0.0108 Iteration 80, loss = 0.0243 --- Epoch 49 / 100000 - 2497 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0418 Iteration 80, loss = 0.0075 --- Epoch 50 / 100000 - 2498 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0037 --- Epoch 51 / 100000 - 2499 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0024 --- Epoch 52 / 100000 - 2500 epochs total Iteration 0, loss = 0.0185 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0354 Iteration 60, loss = 0.0471 Iteration 80, loss = 0.0094 --- Epoch 53 / 100000 - 2501 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0901 Iteration 40, loss = 0.0232 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0045 --- Epoch 54 / 100000 - 2502 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0088 --- Epoch 55 / 100000 - 2503 epochs total Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0186 --- Epoch 56 / 100000 - 2504 epochs total 
Iteration 0, loss = 0.0333 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0191 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0087 --- Epoch 57 / 100000 - 2505 epochs total Iteration 0, loss = 0.0469 Iteration 20, loss = 0.0514 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0114 --- Epoch 58 / 100000 - 2506 epochs total Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0184 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0106 --- Epoch 59 / 100000 - 2507 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0821 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0029 --- Epoch 60 / 100000 - 2508 epochs total Iteration 0, loss = 0.0290 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0018 --- Epoch 61 / 100000 - 2509 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0378 Iteration 80, loss = 0.0080 --- Epoch 62 / 100000 - 2510 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0657 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0156 --- Epoch 63 / 100000 - 2511 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0045 --- Epoch 64 / 100000 - 2512 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0237 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0165 --- Epoch 65 / 100000 - 2513 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0038 --- Epoch 66 / 100000 - 2514 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0041 --- Epoch 67 / 100000 - 2515 epochs total 
Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0023 --- Epoch 68 / 100000 - 2516 epochs total Iteration 0, loss = 0.0174 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0533 --- Epoch 69 / 100000 - 2517 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0491 --- Epoch 70 / 100000 - 2518 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0379 --- Epoch 71 / 100000 - 2519 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0396 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0107 --- Epoch 72 / 100000 - 2520 epochs total Iteration 0, loss = 0.0333 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0052 --- Epoch 73 / 100000 - 2521 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0050 --- Epoch 74 / 100000 - 2522 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0277 Iteration 80, loss = 0.0069 --- Epoch 75 / 100000 - 2523 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0062 --- Epoch 76 / 100000 - 2524 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0205 Iteration 80, loss = 0.0122 --- Epoch 77 / 100000 - 2525 epochs total Iteration 0, loss = 0.0284 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0034 --- Epoch 78 / 100000 - 2526 epochs total 
Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0333 Iteration 80, loss = 0.0034 --- Epoch 79 / 100000 - 2527 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0071 --- Epoch 80 / 100000 - 2528 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0450 --- Epoch 81 / 100000 - 2529 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0059 --- Epoch 82 / 100000 - 2530 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0266 Iteration 80, loss = 0.0061 --- Epoch 83 / 100000 - 2531 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0173 Iteration 80, loss = 0.0150 --- Epoch 84 / 100000 - 2532 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0043 --- Epoch 85 / 100000 - 2533 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0523 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0030 --- Epoch 86 / 100000 - 2534 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0144 Iteration 40, loss = 0.0357 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0248 --- Epoch 87 / 100000 - 2535 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0087 --- Epoch 88 / 100000 - 2536 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0040 --- Epoch 89 / 100000 - 2537 epochs total 
Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0122 --- Epoch 90 / 100000 - 2538 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0286 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0071 --- Epoch 91 / 100000 - 2539 epochs total Iteration 0, loss = 0.0206 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0039 --- Epoch 92 / 100000 - 2540 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0051 --- Epoch 93 / 100000 - 2541 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0108 --- Epoch 94 / 100000 - 2542 epochs total Iteration 0, loss = 0.0291 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0165 --- Epoch 95 / 100000 - 2543 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0238 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0091 --- Epoch 96 / 100000 - 2544 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0271 Iteration 80, loss = 0.0170 --- Epoch 97 / 100000 - 2545 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0127 --- Epoch 98 / 100000 - 2546 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0231 --- Epoch 99 / 100000 - 2547 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0345 Iteration 80, loss = 0.0081 --- Epoch 100 / 100000 - 2548 epochs total 
Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0139 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0200 --- Epoch 101 / 100000 - 2549 epochs total Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0025 --- Epoch 102 / 100000 - 2550 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0049 --- Epoch 103 / 100000 - 2551 epochs total Iteration 0, loss = 0.0551 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0013 --- Epoch 104 / 100000 - 2552 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0227 Iteration 80, loss = 0.0034 --- Epoch 105 / 100000 - 2553 epochs total Iteration 0, loss = 0.0280 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0038 --- Epoch 106 / 100000 - 2554 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0026 --- Epoch 107 / 100000 - 2555 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0336 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0066 --- Epoch 108 / 100000 - 2556 epochs total Iteration 0, loss = 0.0235 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0079 --- Epoch 109 / 100000 - 2557 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0020 --- Epoch 110 / 100000 - 2558 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0197 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0103 --- Epoch 111 / 100000 - 2559 epochs 
total Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0077 --- Epoch 112 / 100000 - 2560 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0104 --- Epoch 113 / 100000 - 2561 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0259 Iteration 80, loss = 0.0112 --- Epoch 114 / 100000 - 2562 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0110 --- Epoch 115 / 100000 - 2563 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0029 --- Epoch 116 / 100000 - 2564 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0114 --- Epoch 117 / 100000 - 2565 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0008 --- Epoch 118 / 100000 - 2566 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0147 --- Epoch 119 / 100000 - 2567 epochs total Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0259 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0035 --- Epoch 120 / 100000 - 2568 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0304 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0150 --- Epoch 121 / 100000 - 2569 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0140 --- Epoch 122 / 100000 - 2570 
epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0451 Iteration 40, loss = 0.0242 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0050 --- Epoch 123 / 100000 - 2571 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0404 Iteration 80, loss = 0.0134 --- Epoch 124 / 100000 - 2572 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0049 --- Epoch 125 / 100000 - 2573 epochs total Iteration 0, loss = 0.0368 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0121 --- Epoch 126 / 100000 - 2574 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0070 --- Epoch 127 / 100000 - 2575 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0305 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0311 Iteration 80, loss = 0.0091 --- Epoch 128 / 100000 - 2576 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0350 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0156 --- Epoch 129 / 100000 - 2577 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0007 Iteration 80, loss = 0.0040 --- Epoch 130 / 100000 - 2578 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0304 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0099 --- Epoch 131 / 100000 - 2579 epochs total Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0193 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0138 --- Epoch 132 / 100000 - 2580 epochs total Iteration 0, loss = 0.0413 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0062 --- Epoch 133 / 100000 - 
2581 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0043 --- Epoch 134 / 100000 - 2582 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0033 --- Epoch 135 / 100000 - 2583 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0089 --- Epoch 136 / 100000 - 2584 epochs total Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0045 --- Epoch 137 / 100000 - 2585 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0191 --- Epoch 138 / 100000 - 2586 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0126 --- Epoch 139 / 100000 - 2587 epochs total Iteration 0, loss = 0.0240 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0046 --- Epoch 140 / 100000 - 2588 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0111 --- Epoch 141 / 100000 - 2589 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0599 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0042 --- Epoch 142 / 100000 - 2590 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0215 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0127 --- Epoch 143 / 100000 - 2591 epochs total Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0011 --- Epoch 144 / 100000 
- 2592 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0031 --- Epoch 145 / 100000 - 2593 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0050 --- Epoch 146 / 100000 - 2594 epochs total Iteration 0, loss = 0.0246 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0026 --- Epoch 147 / 100000 - 2595 epochs total Iteration 0, loss = 0.0312 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0206 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0488 --- Epoch 148 / 100000 - 2596 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0988 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0103 --- Epoch 149 / 100000 - 2597 epochs total Iteration 0, loss = 0.0154 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0030 --- Epoch 150 / 100000 - 2598 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0419 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0169 --- Epoch 151 / 100000 - 2599 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0146 Iteration 60, loss = 0.0183 Iteration 80, loss = 0.0034 --- Epoch 152 / 100000 - 2600 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0060 --- Epoch 153 / 100000 - 2601 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0062 --- Epoch 154 / 100000 - 2602 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0231 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0421 Iteration 80, loss = 0.0150 --- Epoch 155 / 
100000 - 2603 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0038 --- Epoch 156 / 100000 - 2604 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0379 Iteration 80, loss = 0.0042 --- Epoch 157 / 100000 - 2605 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0132 --- Epoch 158 / 100000 - 2606 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0022 --- Epoch 159 / 100000 - 2607 epochs total Iteration 0, loss = 0.0321 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0224 Iteration 80, loss = 0.0124 --- Epoch 160 / 100000 - 2608 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0309 Iteration 60, loss = 0.0282 Iteration 80, loss = 0.0080 --- Epoch 161 / 100000 - 2609 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0031 --- Epoch 162 / 100000 - 2610 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0087 --- Epoch 163 / 100000 - 2611 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0329 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0044 --- Epoch 164 / 100000 - 2612 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0233 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0313 --- Epoch 165 / 100000 - 2613 epochs total Iteration 0, loss = 0.0309 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0099 --- Epoch 166 
/ 100000 - 2614 epochs total Iteration 0, loss = 0.0363 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0155 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0023 --- Epoch 167 / 100000 - 2615 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0056 --- Epoch 168 / 100000 - 2616 epochs total Iteration 0, loss = 0.0224 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0299 Iteration 80, loss = 0.0073 --- Epoch 169 / 100000 - 2617 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0365 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0124 --- Epoch 170 / 100000 - 2618 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0009 --- Epoch 171 / 100000 - 2619 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0009 --- Epoch 172 / 100000 - 2620 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0050 --- Epoch 173 / 100000 - 2621 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0210 Iteration 80, loss = 0.0061 --- Epoch 174 / 100000 - 2622 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0183 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0039 --- Epoch 175 / 100000 - 2623 epochs total Iteration 0, loss = 0.0300 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0041 --- Epoch 176 / 100000 - 2624 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0348 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0083 --- Epoch 
177 / 100000 - 2625 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0034 --- Epoch 178 / 100000 - 2626 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0035 --- Epoch 179 / 100000 - 2627 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0367 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0092 --- Epoch 180 / 100000 - 2628 epochs total Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0062 --- Epoch 181 / 100000 - 2629 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0482 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0096 --- Epoch 182 / 100000 - 2630 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0038 --- Epoch 183 / 100000 - 2631 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0196 Iteration 80, loss = 0.0019 --- Epoch 184 / 100000 - 2632 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0043 --- Epoch 185 / 100000 - 2633 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0123 --- Epoch 186 / 100000 - 2634 epochs total Iteration 0, loss = 0.0289 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0052 --- Epoch 187 / 100000 - 2635 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0060 --- 
Epoch 188 / 100000 - 2636 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0047 --- Epoch 189 / 100000 - 2637 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0196 --- Epoch 190 / 100000 - 2638 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0279 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0037 --- Epoch 191 / 100000 - 2639 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0423 Iteration 40, loss = 0.0209 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.1049 --- Epoch 192 / 100000 - 2640 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0057 --- Epoch 193 / 100000 - 2641 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0145 Iteration 80, loss = 0.0033 --- Epoch 194 / 100000 - 2642 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0142 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0084 --- Epoch 195 / 100000 - 2643 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0324 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0220 --- Epoch 196 / 100000 - 2644 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0174 --- Epoch 197 / 100000 - 2645 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0143 Iteration 80, loss = 0.0146 --- Epoch 198 / 100000 - 2646 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0037 
--- Epoch 199 / 100000 - 2647 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0185 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0021 --- Epoch 200 / 100000 - 2648 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0191 --- Epoch 201 / 100000 - 2649 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0157 --- Epoch 202 / 100000 - 2650 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0250 Iteration 60, loss = 0.0270 Iteration 80, loss = 0.0079 --- Epoch 203 / 100000 - 2651 epochs total Iteration 0, loss = 0.0422 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0188 --- Epoch 204 / 100000 - 2652 epochs total Iteration 0, loss = 0.0251 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0147 --- Epoch 205 / 100000 - 2653 epochs total Iteration 0, loss = 0.0438 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0122 --- Epoch 206 / 100000 - 2654 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0672 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0047 --- Epoch 207 / 100000 - 2655 epochs total Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0507 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0037 --- Epoch 208 / 100000 - 2656 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0029 --- Epoch 209 / 100000 - 2657 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0067 Iteration 80, loss = 
0.0039 --- Epoch 210 / 100000 - 2658 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0058 --- Epoch 211 / 100000 - 2659 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0688 --- Epoch 212 / 100000 - 2660 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0180 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0206 --- Epoch 213 / 100000 - 2661 epochs total Iteration 0, loss = 0.0346 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0211 --- Epoch 214 / 100000 - 2662 epochs total Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0299 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0107 --- Epoch 215 / 100000 - 2663 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0243 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0016 --- Epoch 216 / 100000 - 2664 epochs total Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0201 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0179 --- Epoch 217 / 100000 - 2665 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0210 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0035 --- Epoch 218 / 100000 - 2666 epochs total Iteration 0, loss = 0.0169 Iteration 20, loss = 0.0126 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0118 --- Epoch 219 / 100000 - 2667 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0019 --- Epoch 220 / 100000 - 2668 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0880 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0038 Iteration 80, loss 
= 0.0063 --- Epoch 221 / 100000 - 2669 epochs total Iteration 0, loss = 0.0369 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0636 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0090 --- Epoch 222 / 100000 - 2670 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0237 Iteration 80, loss = 0.0056 --- Epoch 223 / 100000 - 2671 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0090 --- Epoch 224 / 100000 - 2672 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0164 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0979 --- Epoch 225 / 100000 - 2673 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0238 Iteration 60, loss = 0.0329 Iteration 80, loss = 0.0119 --- Epoch 226 / 100000 - 2674 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0104 --- Epoch 227 / 100000 - 2675 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0317 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0254 Iteration 80, loss = 0.0030 --- Epoch 228 / 100000 - 2676 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0119 --- Epoch 229 / 100000 - 2677 epochs total Iteration 0, loss = 0.0358 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0249 Iteration 80, loss = 0.0260 --- Epoch 230 / 100000 - 2678 epochs total Iteration 0, loss = 0.0333 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0051 --- Epoch 231 / 100000 - 2679 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0090 Iteration 80, 
loss = 0.0017 --- Epoch 232 / 100000 - 2680 epochs total Iteration 0, loss = 0.0517 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0180 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0047 --- Epoch 233 / 100000 - 2681 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0223 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0162 --- Epoch 234 / 100000 - 2682 epochs total Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0206 --- Epoch 235 / 100000 - 2683 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0247 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0036 --- Epoch 236 / 100000 - 2684 epochs total Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0125 Iteration 80, loss = 0.0191 --- Epoch 237 / 100000 - 2685 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0090 --- Epoch 238 / 100000 - 2686 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0024 --- Epoch 239 / 100000 - 2687 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0071 --- Epoch 240 / 100000 - 2688 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0081 --- Epoch 241 / 100000 - 2689 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0043 --- Epoch 242 / 100000 - 2690 epochs total Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0234 Iteration 
80, loss = 0.0105 --- Epoch 243 / 100000 - 2691 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0052 --- Epoch 244 / 100000 - 2692 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0027 --- Epoch 245 / 100000 - 2693 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0233 --- Epoch 246 / 100000 - 2694 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0245 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0224 --- Epoch 247 / 100000 - 2695 epochs total Iteration 0, loss = 0.0151 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0955 Iteration 60, loss = 0.0218 Iteration 80, loss = 0.0178 --- Epoch 248 / 100000 - 2696 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0193 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0056 --- Epoch 249 / 100000 - 2697 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0080 --- Epoch 250 / 100000 - 2698 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0526 --- Epoch 251 / 100000 - 2699 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0036 --- Epoch 252 / 100000 - 2700 epochs total Iteration 0, loss = 0.0276 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0032 --- Epoch 253 / 100000 - 2701 epochs total Iteration 0, loss = 0.0232 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0058 
Iteration 80, loss = 0.0062 --- Epoch 254 / 100000 - 2702 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0191 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0044 --- Epoch 255 / 100000 - 2703 epochs total Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0036 --- Epoch 256 / 100000 - 2704 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0305 Iteration 80, loss = 0.0095 --- Epoch 257 / 100000 - 2705 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0158 --- Epoch 258 / 100000 - 2706 epochs total Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0311 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0134 --- Epoch 259 / 100000 - 2707 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0042 --- Epoch 260 / 100000 - 2708 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0041 --- Epoch 261 / 100000 - 2709 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0108 Iteration 80, loss = 0.0081 --- Epoch 262 / 100000 - 2710 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0062 --- Epoch 263 / 100000 - 2711 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0147 --- Epoch 264 / 100000 - 2712 epochs total Iteration 0, loss = 0.0580 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0121 Iteration 60, loss = 
0.0184 Iteration 80, loss = 0.0272 --- Epoch 265 / 100000 - 2713 epochs total Iteration 0, loss = 0.0591 Iteration 20, loss = 0.0453 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0201 Iteration 80, loss = 0.0517 --- Epoch 266 / 100000 - 2714 epochs total Iteration 0, loss = 0.0177 Iteration 20, loss = 0.0207 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0020 --- Epoch 267 / 100000 - 2715 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0248 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0129 --- Epoch 268 / 100000 - 2716 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0070 --- Epoch 269 / 100000 - 2717 epochs total Iteration 0, loss = 0.0051 Iteration 20, loss = 0.0251 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0372 --- Epoch 270 / 100000 - 2718 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0291 --- Epoch 271 / 100000 - 2719 epochs total Iteration 0, loss = 0.0201 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0268 Iteration 80, loss = 0.0028 --- Epoch 272 / 100000 - 2720 epochs total Iteration 0, loss = 0.0219 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0334 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0114 --- Epoch 273 / 100000 - 2721 epochs total Iteration 0, loss = 0.0390 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0174 --- Epoch 274 / 100000 - 2722 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0012 --- Epoch 275 / 100000 - 2723 epochs total Iteration 0, loss = 0.0190 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0031 Iteration 60, loss 
= 0.0055 Iteration 80, loss = 0.0306 --- Epoch 276 / 100000 - 2724 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0038 --- Epoch 277 / 100000 - 2725 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0133 --- Epoch 278 / 100000 - 2726 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0202 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0024 --- Epoch 279 / 100000 - 2727 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0266 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0154 Iteration 80, loss = 0.0042 --- Epoch 280 / 100000 - 2728 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0350 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0351 Iteration 80, loss = 0.0012 --- Epoch 281 / 100000 - 2729 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0039 --- Epoch 282 / 100000 - 2730 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0187 Iteration 80, loss = 0.0075 --- Epoch 283 / 100000 - 2731 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0162 Iteration 40, loss = 0.0090 Iteration 60, loss = 0.0144 Iteration 80, loss = 0.0141 --- Epoch 284 / 100000 - 2732 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0251 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0058 --- Epoch 285 / 100000 - 2733 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0034 --- Epoch 286 / 100000 - 2734 epochs total Iteration 0, loss = 0.0376 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0143 Iteration 60, 
loss = 0.0081 Iteration 80, loss = 0.0156 --- Epoch 287 / 100000 - 2735 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0027 --- Epoch 288 / 100000 - 2736 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0057 --- Epoch 289 / 100000 - 2737 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0172 --- Epoch 290 / 100000 - 2738 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0222 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0234 Iteration 80, loss = 0.0126 --- Epoch 291 / 100000 - 2739 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0109 Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0099 --- Epoch 292 / 100000 - 2740 epochs total Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0235 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0080 --- Epoch 293 / 100000 - 2741 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0374 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0067 --- Epoch 294 / 100000 - 2742 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0257 Iteration 80, loss = 0.0092 --- Epoch 295 / 100000 - 2743 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0115 Iteration 80, loss = 0.0132 --- Epoch 296 / 100000 - 2744 epochs total Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0076 --- Epoch 297 / 100000 - 2745 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0036 Iteration 
60, loss = 0.0063 Iteration 80, loss = 0.0144 --- Epoch 298 / 100000 - 2746 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0045 --- Epoch 299 / 100000 - 2747 epochs total Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0122 Iteration 40, loss = 0.0305 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0225 --- Epoch 300 / 100000 - 2748 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0116 --- Epoch 301 / 100000 - 2749 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0285 Iteration 80, loss = 0.0027 --- Epoch 302 / 100000 - 2750 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0215 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0066 --- Epoch 303 / 100000 - 2751 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0215 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0036 --- Epoch 304 / 100000 - 2752 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0028 --- Epoch 305 / 100000 - 2753 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0010 --- Epoch 306 / 100000 - 2754 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0014 --- Epoch 307 / 100000 - 2755 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0136 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0026 --- Epoch 308 / 100000 - 2756 epochs total Iteration 0, loss = 0.0369 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0020 
Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0123 --- Epoch 309 / 100000 - 2757 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0232 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0151 --- Epoch 310 / 100000 - 2758 epochs total Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0119 --- Epoch 311 / 100000 - 2759 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0062 --- Epoch 312 / 100000 - 2760 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0439 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0138 Iteration 80, loss = 0.0211 --- Epoch 313 / 100000 - 2761 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0012 --- Epoch 314 / 100000 - 2762 epochs total Iteration 0, loss = 0.0131 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0178 --- Epoch 315 / 100000 - 2763 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0196 Iteration 80, loss = 0.0088 --- Epoch 316 / 100000 - 2764 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0138 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0046 --- Epoch 317 / 100000 - 2765 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0023 --- Epoch 318 / 100000 - 2766 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0204 Iteration 80, loss = 0.0100 --- Epoch 319 / 100000 - 2767 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0115 Iteration 40, loss = 
0.0167 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0012 --- Epoch 320 / 100000 - 2768 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0119 --- Epoch 321 / 100000 - 2769 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0040 --- Epoch 322 / 100000 - 2770 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0131 --- Epoch 323 / 100000 - 2771 epochs total Iteration 0, loss = 0.0243 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0018 --- Epoch 324 / 100000 - 2772 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0180 Iteration 60, loss = 0.0203 Iteration 80, loss = 0.0300 --- Epoch 325 / 100000 - 2773 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0202 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0025 --- Epoch 326 / 100000 - 2774 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0327 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0072 --- Epoch 327 / 100000 - 2775 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0232 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0037 --- Epoch 328 / 100000 - 2776 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0306 --- Epoch 329 / 100000 - 2777 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0319 --- Epoch 330 / 100000 - 2778 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0083 Iteration 40, loss 
= 0.0069 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0093 --- Epoch 331 / 100000 - 2779 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0070 --- Epoch 332 / 100000 - 2780 epochs total Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0116 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0044 --- Epoch 333 / 100000 - 2781 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0037 --- Epoch 334 / 100000 - 2782 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0070 --- Epoch 335 / 100000 - 2783 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0155 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0065 --- Epoch 336 / 100000 - 2784 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0591 Iteration 80, loss = 0.0057 --- Epoch 337 / 100000 - 2785 epochs total Iteration 0, loss = 0.0230 Iteration 20, loss = 0.0300 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0221 Iteration 80, loss = 0.0169 --- Epoch 338 / 100000 - 2786 epochs total Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0250 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0094 --- Epoch 339 / 100000 - 2787 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0239 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0107 --- Epoch 340 / 100000 - 2788 epochs total Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0031 --- Epoch 341 / 100000 - 2789 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0021 Iteration 40, 
loss = 0.0018 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0122 --- Epoch 342 / 100000 - 2790 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0685 Iteration 80, loss = 0.0092 --- Epoch 343 / 100000 - 2791 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0235 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0051 --- Epoch 344 / 100000 - 2792 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0807 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0138 --- Epoch 345 / 100000 - 2793 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0099 Iteration 80, loss = 0.0048 --- Epoch 346 / 100000 - 2794 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0027 --- Epoch 347 / 100000 - 2795 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0218 Iteration 60, loss = 0.0213 Iteration 80, loss = 0.0049 --- Epoch 348 / 100000 - 2796 epochs total Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0100 --- Epoch 349 / 100000 - 2797 epochs total Iteration 0, loss = 0.0231 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0054 --- Epoch 350 / 100000 - 2798 epochs total Iteration 0, loss = 0.0177 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0211 Iteration 80, loss = 0.0035 --- Epoch 351 / 100000 - 2799 epochs total Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0036 --- Epoch 352 / 100000 - 2800 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0015 Iteration 
40, loss = 0.0039 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0114 --- Epoch 353 / 100000 - 2801 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0148 --- Epoch 354 / 100000 - 2802 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0044 --- Epoch 355 / 100000 - 2803 epochs total Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0882 --- Epoch 356 / 100000 - 2804 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0140 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0097 --- Epoch 357 / 100000 - 2805 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0364 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0112 --- Epoch 358 / 100000 - 2806 epochs total Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0278 --- Epoch 359 / 100000 - 2807 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0048 --- Epoch 360 / 100000 - 2808 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0024 --- Epoch 361 / 100000 - 2809 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0016 --- Epoch 362 / 100000 - 2810 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0010 --- Epoch 363 / 100000 - 2811 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0081 
Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0036 --- Epoch 364 / 100000 - 2812 epochs total Iteration 0, loss = 0.0280 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0158 --- Epoch 365 / 100000 - 2813 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0144 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0027 --- Epoch 366 / 100000 - 2814 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0322 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0015 --- Epoch 367 / 100000 - 2815 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0282 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0063 --- Epoch 368 / 100000 - 2816 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0164 Iteration 80, loss = 0.0084 --- Epoch 369 / 100000 - 2817 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0037 --- Epoch 370 / 100000 - 2818 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0093 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0058 --- Epoch 371 / 100000 - 2819 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0102 --- Epoch 372 / 100000 - 2820 epochs total Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0219 --- Epoch 373 / 100000 - 2821 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0016 --- Epoch 374 / 100000 - 2822 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 
0.0044 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0023 --- Epoch 375 / 100000 - 2823 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0111 --- Epoch 376 / 100000 - 2824 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0352 Iteration 80, loss = 0.0037 --- Epoch 377 / 100000 - 2825 epochs total Iteration 0, loss = 0.0183 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0039 --- Epoch 378 / 100000 - 2826 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0275 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0041 --- Epoch 379 / 100000 - 2827 epochs total Iteration 0, loss = 0.0317 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0239 Iteration 80, loss = 0.0051 --- Epoch 380 / 100000 - 2828 epochs total Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0087 --- Epoch 381 / 100000 - 2829 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0016 --- Epoch 382 / 100000 - 2830 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0008 Iteration 80, loss = 0.0044 --- Epoch 383 / 100000 - 2831 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0234 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0095 --- Epoch 384 / 100000 - 2832 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0263 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0047 --- Epoch 385 / 100000 - 2833 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss 
= 0.0030 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0053 --- Epoch 386 / 100000 - 2834 epochs total Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0168 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0119 --- Epoch 387 / 100000 - 2835 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0051 --- Epoch 388 / 100000 - 2836 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0249 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0032 --- Epoch 389 / 100000 - 2837 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0091 --- Epoch 390 / 100000 - 2838 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0258 --- Epoch 391 / 100000 - 2839 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0049 --- Epoch 392 / 100000 - 2840 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0065 Iteration 60, loss = 0.0707 Iteration 80, loss = 0.0114 --- Epoch 393 / 100000 - 2841 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0046 --- Epoch 394 / 100000 - 2842 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0112 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0082 --- Epoch 395 / 100000 - 2843 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0112 --- Epoch 396 / 100000 - 2844 epochs total Iteration 0, loss = 0.0201 Iteration 20, 
loss = 0.0138 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0039 --- Epoch 397 / 100000 - 2845 epochs total Iteration 0, loss = 0.0330 Iteration 20, loss = 0.0176 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0084 --- Epoch 398 / 100000 - 2846 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0076 --- Epoch 399 / 100000 - 2847 epochs total Iteration 0, loss = 0.0167 Iteration 20, loss = 0.0304 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0131 Iteration 80, loss = 0.0138 --- Epoch 400 / 100000 - 2848 epochs total Iteration 0, loss = 0.0182 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0358 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0033 --- Epoch 401 / 100000 - 2849 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0248 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0408 --- Epoch 402 / 100000 - 2850 epochs total Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0249 Iteration 40, loss = 0.0178 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0020 --- Epoch 403 / 100000 - 2851 epochs total Iteration 0, loss = 0.0117 Iteration 20, loss = 0.0386 Iteration 40, loss = 0.0131 Iteration 60, loss = 0.0352 Iteration 80, loss = 0.0109 --- Epoch 404 / 100000 - 2852 epochs total Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0130 --- Epoch 405 / 100000 - 2853 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0133 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0089 --- Epoch 406 / 100000 - 2854 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0343 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0066 --- Epoch 407 / 100000 - 2855 epochs total Iteration 0, loss = 0.0090 Iteration 
20, loss = 0.0051 Iteration 40, loss = 0.0506 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0030 --- Epoch 408 / 100000 - 2856 epochs total Iteration 0, loss = 0.0552 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0146 Iteration 80, loss = 0.0073 --- Epoch 409 / 100000 - 2857 epochs total Iteration 0, loss = 0.0151 Iteration 20, loss = 0.0229 Iteration 40, loss = 0.0074 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0061 --- Epoch 410 / 100000 - 2858 epochs total Iteration 0, loss = 0.0048 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0191 Iteration 80, loss = 0.0040 --- Epoch 411 / 100000 - 2859 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0053 --- Epoch 412 / 100000 - 2860 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0135 --- Epoch 413 / 100000 - 2861 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0122 Iteration 80, loss = 0.0074 --- Epoch 414 / 100000 - 2862 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0054 --- Epoch 415 / 100000 - 2863 epochs total Iteration 0, loss = 0.0452 Iteration 20, loss = 0.0132 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0154 --- Epoch 416 / 100000 - 2864 epochs total Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0298 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0145 --- Epoch 417 / 100000 - 2865 epochs total Iteration 0, loss = 0.0071 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0282 --- Epoch 418 / 100000 - 2866 epochs total Iteration 0, loss = 0.0100 
Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0295 Iteration 80, loss = 0.0091 --- Epoch 419 / 100000 - 2867 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0171 --- Epoch 420 / 100000 - 2868 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0016 --- Epoch 421 / 100000 - 2869 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0017 --- Epoch 422 / 100000 - 2870 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0226 Iteration 80, loss = 0.0035 --- Epoch 423 / 100000 - 2871 epochs total Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0115 --- Epoch 424 / 100000 - 2872 epochs total Iteration 0, loss = 0.0201 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0429 --- Epoch 425 / 100000 - 2873 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0014 --- Epoch 426 / 100000 - 2874 epochs total Iteration 0, loss = 0.0592 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0333 Iteration 80, loss = 0.0169 --- Epoch 427 / 100000 - 2875 epochs total Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0141 --- Epoch 428 / 100000 - 2876 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0108 --- Epoch 429 / 100000 - 2877 epochs total Iteration 0, loss = 
0.0217 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0201 --- Epoch 430 / 100000 - 2878 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0213 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0052 --- Epoch 431 / 100000 - 2879 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0179 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0013 --- Epoch 432 / 100000 - 2880 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0029 --- Epoch 433 / 100000 - 2881 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0218 --- Epoch 434 / 100000 - 2882 epochs total Iteration 0, loss = 0.0149 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0110 --- Epoch 435 / 100000 - 2883 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0229 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0066 --- Epoch 436 / 100000 - 2884 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0127 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0087 --- Epoch 437 / 100000 - 2885 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0258 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0106 --- Epoch 438 / 100000 - 2886 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0221 --- Epoch 439 / 100000 - 2887 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0713 Iteration 80, loss = 0.0018 --- Epoch 440 / 100000 - 2888 epochs total Iteration 0, loss 
= 0.0158 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0017 --- Epoch 441 / 100000 - 2889 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0040 --- Epoch 442 / 100000 - 2890 epochs total Iteration 0, loss = 0.0268 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0490 --- Epoch 443 / 100000 - 2891 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0040 --- Epoch 444 / 100000 - 2892 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0114 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0223 --- Epoch 445 / 100000 - 2893 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0286 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0070 --- Epoch 446 / 100000 - 2894 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0026 --- Epoch 447 / 100000 - 2895 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0199 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0029 --- Epoch 448 / 100000 - 2896 epochs total Iteration 0, loss = 0.0330 Iteration 20, loss = 0.0511 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0094 --- Epoch 449 / 100000 - 2897 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0011 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0083 --- Epoch 450 / 100000 - 2898 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0188 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0083 --- Epoch 451 / 100000 - 2899 epochs total Iteration 0, 
loss = 0.0039 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0036 --- Epoch 452 / 100000 - 2900 epochs total Iteration 0, loss = 0.0202 Iteration 20, loss = 0.0084 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0104 --- Epoch 453 / 100000 - 2901 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0137 --- Epoch 454 / 100000 - 2902 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0373 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0082 --- Epoch 455 / 100000 - 2903 epochs total Iteration 0, loss = 0.0144 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0259 --- Epoch 456 / 100000 - 2904 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0172 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0219 Iteration 80, loss = 0.0040 --- Epoch 457 / 100000 - 2905 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0095 --- Epoch 458 / 100000 - 2906 epochs total Iteration 0, loss = 0.0457 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0100 --- Epoch 459 / 100000 - 2907 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0117 --- Epoch 460 / 100000 - 2908 epochs total Iteration 0, loss = 0.0388 Iteration 20, loss = 0.0169 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0146 --- Epoch 461 / 100000 - 2909 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0270 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0207 Iteration 80, loss = 0.0048 --- Epoch 462 / 100000 - 2910 epochs total Iteration 
0, loss = 0.0238 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0171 Iteration 80, loss = 0.0201 --- Epoch 463 / 100000 - 2911 epochs total Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0121 --- Epoch 464 / 100000 - 2912 epochs total Iteration 0, loss = 0.0008 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0183 --- Epoch 465 / 100000 - 2913 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0013 Iteration 80, loss = 0.0079 --- Epoch 466 / 100000 - 2914 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0165 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0047 --- Epoch 467 / 100000 - 2915 epochs total Iteration 0, loss = 0.0195 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0158 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0252 --- Epoch 468 / 100000 - 2916 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0309 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0419 --- Epoch 469 / 100000 - 2917 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0060 --- Epoch 470 / 100000 - 2918 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0025 --- Epoch 471 / 100000 - 2919 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0148 --- Epoch 472 / 100000 - 2920 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0084 --- Epoch 473 / 100000 - 2921 epochs total 
Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0037 --- Epoch 474 / 100000 - 2922 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0192 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0344 --- Epoch 475 / 100000 - 2923 epochs total Iteration 0, loss = 0.0175 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0166 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0134 --- Epoch 476 / 100000 - 2924 epochs total Iteration 0, loss = 0.0196 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0037 --- Epoch 477 / 100000 - 2925 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0079 --- Epoch 478 / 100000 - 2926 epochs total Iteration 0, loss = 0.0246 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0112 Iteration 80, loss = 0.0100 --- Epoch 479 / 100000 - 2927 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0120 Iteration 80, loss = 0.0164 --- Epoch 480 / 100000 - 2928 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0346 Iteration 40, loss = 0.0203 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0035 --- Epoch 481 / 100000 - 2929 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0046 --- Epoch 482 / 100000 - 2930 epochs total Iteration 0, loss = 0.0303 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0054 --- Epoch 483 / 100000 - 2931 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0236 Iteration 80, loss = 0.0061 --- Epoch 484 / 100000 - 2932 epochs 
total Iteration 0, loss = 0.0650 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0018 --- Epoch 485 / 100000 - 2933 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0061 --- Epoch 486 / 100000 - 2934 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0086 --- Epoch 487 / 100000 - 2935 epochs total Iteration 0, loss = 0.0163 Iteration 20, loss = 0.0341 Iteration 40, loss = 0.0119 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0034 --- Epoch 488 / 100000 - 2936 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0205 Iteration 60, loss = 0.0055 Iteration 80, loss = 0.0199 --- Epoch 489 / 100000 - 2937 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0029 --- Epoch 490 / 100000 - 2938 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0111 --- Epoch 491 / 100000 - 2939 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0065 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0299 Iteration 80, loss = 0.0207 --- Epoch 492 / 100000 - 2940 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0132 --- Epoch 493 / 100000 - 2941 epochs total Iteration 0, loss = 0.0188 Iteration 20, loss = 0.0296 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0044 --- Epoch 494 / 100000 - 2942 epochs total Iteration 0, loss = 0.0130 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0087 --- Epoch 495 / 100000 - 2943 
epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0066 --- Epoch 496 / 100000 - 2944 epochs total Iteration 0, loss = 0.0462 Iteration 20, loss = 0.0314 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0178 Iteration 80, loss = 0.0037 --- Epoch 497 / 100000 - 2945 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0143 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0435 --- Epoch 498 / 100000 - 2946 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0026 --- Epoch 499 / 100000 - 2947 epochs total Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0274 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0215 --- Epoch 500 / 100000 - 2948 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0229 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0347 Iteration 80, loss = 0.0085 --- Epoch 501 / 100000 - 2949 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0051 --- Epoch 502 / 100000 - 2950 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0038 --- Epoch 503 / 100000 - 2951 epochs total Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0012 --- Epoch 504 / 100000 - 2952 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0109 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0073 --- Epoch 505 / 100000 - 2953 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0083 --- Epoch 506 / 100000 - 
2954 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0037 --- Epoch 507 / 100000 - 2955 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0309 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0032 --- Epoch 508 / 100000 - 2956 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0329 Iteration 80, loss = 0.0050 --- Epoch 509 / 100000 - 2957 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0231 Iteration 80, loss = 0.0090 --- Epoch 510 / 100000 - 2958 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0145 --- Epoch 511 / 100000 - 2959 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0094 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0302 --- Epoch 512 / 100000 - 2960 epochs total Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0188 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0098 --- Epoch 513 / 100000 - 2961 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0053 --- Epoch 514 / 100000 - 2962 epochs total Iteration 0, loss = 0.0189 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0110 Iteration 80, loss = 0.0229 --- Epoch 515 / 100000 - 2963 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0072 --- Epoch 516 / 100000 - 2964 epochs total Iteration 0, loss = 0.0244 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0203 Iteration 80, loss = 0.0194 --- Epoch 517 / 100000 
- 2965 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0059 --- Epoch 518 / 100000 - 2966 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0225 Iteration 40, loss = 0.0901 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0017 --- Epoch 519 / 100000 - 2967 epochs total Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0183 --- Epoch 520 / 100000 - 2968 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0059 --- Epoch 521 / 100000 - 2969 epochs total Iteration 0, loss = 0.0297 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0145 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0139 --- Epoch 522 / 100000 - 2970 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0191 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0135 --- Epoch 523 / 100000 - 2971 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0038 --- Epoch 524 / 100000 - 2972 epochs total Iteration 0, loss = 0.0284 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0050 --- Epoch 525 / 100000 - 2973 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0059 --- Epoch 526 / 100000 - 2974 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0064 --- Epoch 527 / 100000 - 2975 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0129 --- Epoch 528 / 
100000 - 2976 epochs total Iteration 0, loss = 0.0548 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0080 --- Epoch 529 / 100000 - 2977 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0272 Iteration 40, loss = 0.0123 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0209 --- Epoch 530 / 100000 - 2978 epochs total Iteration 0, loss = 0.0159 Iteration 20, loss = 0.0309 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0108 --- Epoch 531 / 100000 - 2979 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0040 --- Epoch 532 / 100000 - 2980 epochs total Iteration 0, loss = 0.0294 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0061 --- Epoch 533 / 100000 - 2981 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0290 --- Epoch 534 / 100000 - 2982 epochs total Iteration 0, loss = 0.0671 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0367 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0180 --- Epoch 535 / 100000 - 2983 epochs total Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0306 Iteration 80, loss = 0.0119 --- Epoch 536 / 100000 - 2984 epochs total Iteration 0, loss = 0.0165 Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0032 --- Epoch 537 / 100000 - 2985 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0121 Iteration 80, loss = 0.0037 --- Epoch 538 / 100000 - 2986 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0247 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0054 --- Epoch 539 
/ 100000 - 2987 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0280 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0137 --- Epoch 540 / 100000 - 2988 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0197 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0040 --- Epoch 541 / 100000 - 2989 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0173 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0049 --- Epoch 542 / 100000 - 2990 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0346 Iteration 80, loss = 0.0028 --- Epoch 543 / 100000 - 2991 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0024 --- Epoch 544 / 100000 - 2992 epochs total Iteration 0, loss = 0.0401 Iteration 20, loss = 0.0229 Iteration 40, loss = 0.0464 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0024 --- Epoch 545 / 100000 - 2993 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0396 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0084 --- Epoch 546 / 100000 - 2994 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0119 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0340 Iteration 80, loss = 0.0076 --- Epoch 547 / 100000 - 2995 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0065 --- Epoch 548 / 100000 - 2996 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0250 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0014 --- Epoch 549 / 100000 - 2997 epochs total Iteration 0, loss = 0.0245 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0047 --- Epoch 
550 / 100000 - 2998 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0093 --- Epoch 551 / 100000 - 2999 epochs total Iteration 0, loss = 0.0232 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0262 --- Epoch 552 / 100000 - 3000 epochs total Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0419 Iteration 40, loss = 0.0122 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0162 --- Epoch 553 / 100000 - 3001 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0102 --- Epoch 554 / 100000 - 3002 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0186 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0281 Iteration 80, loss = 0.0221 --- Epoch 555 / 100000 - 3003 epochs total Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0331 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0025 --- Epoch 556 / 100000 - 3004 epochs total Iteration 0, loss = 0.0104 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0197 Iteration 60, loss = 0.0225 Iteration 80, loss = 0.0034 --- Epoch 557 / 100000 - 3005 epochs total Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0035 --- Epoch 558 / 100000 - 3006 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0186 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0023 --- Epoch 559 / 100000 - 3007 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0173 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0067 --- Epoch 560 / 100000 - 3008 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0155 Iteration 80, loss = 0.0077 --- 
Epoch 561 / 100000 - 3009 epochs total Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0261 Iteration 40, loss = 0.0141 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0020 --- Epoch 562 / 100000 - 3010 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0114 --- Epoch 563 / 100000 - 3011 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0089 Iteration 80, loss = 0.0062 --- Epoch 564 / 100000 - 3012 epochs total Iteration 0, loss = 0.0234 Iteration 20, loss = 0.0306 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0166 --- Epoch 565 / 100000 - 3013 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0076 --- Epoch 566 / 100000 - 3014 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0199 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0107 --- Epoch 567 / 100000 - 3015 epochs total Iteration 0, loss = 0.0268 Iteration 20, loss = 0.0247 Iteration 40, loss = 0.0285 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0045 --- Epoch 568 / 100000 - 3016 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0245 --- Epoch 569 / 100000 - 3017 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0161 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0254 --- Epoch 570 / 100000 - 3018 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0036 --- Epoch 571 / 100000 - 3019 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0016 
--- Epoch 572 / 100000 - 3020 epochs total Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0156 --- Epoch 573 / 100000 - 3021 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0274 Iteration 60, loss = 0.0228 Iteration 80, loss = 0.0013 --- Epoch 574 / 100000 - 3022 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0181 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0048 --- Epoch 575 / 100000 - 3023 epochs total Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0186 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0022 --- Epoch 576 / 100000 - 3024 epochs total Iteration 0, loss = 0.0191 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0090 --- Epoch 577 / 100000 - 3025 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0012 --- Epoch 578 / 100000 - 3026 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0214 --- Epoch 579 / 100000 - 3027 epochs total Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0345 --- Epoch 580 / 100000 - 3028 epochs total Iteration 0, loss = 0.0290 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0287 --- Epoch 581 / 100000 - 3029 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0088 --- Epoch 582 / 100000 - 3030 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0041 Iteration 80, loss = 
0.0016 --- Epoch 583 / 100000 - 3031 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0098 --- Epoch 584 / 100000 - 3032 epochs total Iteration 0, loss = 0.0151 Iteration 20, loss = 0.0205 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0038 --- Epoch 585 / 100000 - 3033 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0304 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0374 --- Epoch 586 / 100000 - 3034 epochs total Iteration 0, loss = 0.0077 Iteration 20, loss = 0.0188 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0388 --- Epoch 587 / 100000 - 3035 epochs total Iteration 0, loss = 0.0069 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0028 --- Epoch 588 / 100000 - 3036 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0020 --- Epoch 589 / 100000 - 3037 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0021 --- Epoch 590 / 100000 - 3038 epochs total Iteration 0, loss = 0.0147 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0208 Iteration 80, loss = 0.0101 --- Epoch 591 / 100000 - 3039 epochs total Iteration 0, loss = 0.0665 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0120 --- Epoch 592 / 100000 - 3040 epochs total Iteration 0, loss = 0.0193 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0111 --- Epoch 593 / 100000 - 3041 epochs total Iteration 0, loss = 0.0292 Iteration 20, loss = 0.0414 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0021 Iteration 80, loss 
= 0.0182 --- Epoch 594 / 100000 - 3042 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0032 --- Epoch 595 / 100000 - 3043 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0127 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0026 --- Epoch 596 / 100000 - 3044 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0361 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0056 --- Epoch 597 / 100000 - 3045 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0056 --- Epoch 598 / 100000 - 3046 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0070 --- Epoch 599 / 100000 - 3047 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0265 Iteration 40, loss = 0.0240 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0114 --- Epoch 600 / 100000 - 3048 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0037 --- Epoch 601 / 100000 - 3049 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0455 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0194 --- Epoch 602 / 100000 - 3050 epochs total Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0161 --- Epoch 603 / 100000 - 3051 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0298 Iteration 60, loss = 0.0108 Iteration 80, loss = 0.0075 --- Epoch 604 / 100000 - 3052 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0176 Iteration 60, loss = 0.0053 Iteration 80, 
loss = 0.0023 --- Epoch 605 / 100000 - 3053 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0102 Iteration 60, loss = 0.0094 Iteration 80, loss = 0.0034 --- Epoch 606 / 100000 - 3054 epochs total Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0071 --- Epoch 607 / 100000 - 3055 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0149 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0118 --- Epoch 608 / 100000 - 3056 epochs total Iteration 0, loss = 0.0154 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0123 Iteration 80, loss = 0.0028 --- Epoch 609 / 100000 - 3057 epochs total Iteration 0, loss = 0.0008 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0068 --- Epoch 610 / 100000 - 3058 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0222 --- Epoch 611 / 100000 - 3059 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0168 --- Epoch 612 / 100000 - 3060 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0383 Iteration 80, loss = 0.0036 --- Epoch 613 / 100000 - 3061 epochs total Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0056 --- Epoch 614 / 100000 - 3062 epochs total Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0005 Iteration 60, loss = 0.0207 Iteration 80, loss = 0.0099 --- Epoch 615 / 100000 - 3063 epochs total Iteration 0, loss = 0.0179 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0299 Iteration 60, loss = 0.0069 Iteration 
80, loss = 0.0097 --- Epoch 616 / 100000 - 3064 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0085 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0046 --- Epoch 617 / 100000 - 3065 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0088 --- Epoch 618 / 100000 - 3066 epochs total Iteration 0, loss = 0.0416 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0318 Iteration 80, loss = 0.0135 --- Epoch 619 / 100000 - 3067 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0094 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0047 --- Epoch 620 / 100000 - 3068 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0120 Iteration 40, loss = 0.0211 Iteration 60, loss = 0.0417 Iteration 80, loss = 0.0112 --- Epoch 621 / 100000 - 3069 epochs total Iteration 0, loss = 0.0203 Iteration 20, loss = 0.0229 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0069 --- Epoch 622 / 100000 - 3070 epochs total Iteration 0, loss = 0.0177 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0250 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0050 --- Epoch 623 / 100000 - 3071 epochs total Iteration 0, loss = 0.0062 Iteration 20, loss = 0.0090 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0089 --- Epoch 624 / 100000 - 3072 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0290 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0021 --- Epoch 625 / 100000 - 3073 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0044 --- Epoch 626 / 100000 - 3074 epochs total Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0029 
Iteration 80, loss = 0.0065 --- Epoch 627 / 100000 - 3075 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0484 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0109 --- Epoch 628 / 100000 - 3076 epochs total Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0104 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0019 --- Epoch 629 / 100000 - 3077 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0202 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0117 Iteration 80, loss = 0.0041 --- Epoch 630 / 100000 - 3078 epochs total Iteration 0, loss = 0.0167 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0074 --- Epoch 631 / 100000 - 3079 epochs total Iteration 0, loss = 0.0168 Iteration 20, loss = 0.0049 Iteration 40, loss = 0.0295 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0041 --- Epoch 632 / 100000 - 3080 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0158 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0166 Iteration 80, loss = 0.0191 --- Epoch 633 / 100000 - 3081 epochs total Iteration 0, loss = 0.0097 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0052 --- Epoch 634 / 100000 - 3082 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0202 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0023 --- Epoch 635 / 100000 - 3083 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0317 Iteration 80, loss = 0.0035 --- Epoch 636 / 100000 - 3084 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0156 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0023 --- Epoch 637 / 100000 - 3085 epochs total Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0290 Iteration 60, loss = 
0.0105 Iteration 80, loss = 0.0044 --- Epoch 638 / 100000 - 3086 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0082 --- Epoch 639 / 100000 - 3087 epochs total Iteration 0, loss = 0.0301 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0236 Iteration 80, loss = 0.0009 --- Epoch 640 / 100000 - 3088 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0280 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0070 --- Epoch 641 / 100000 - 3089 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0061 --- Epoch 642 / 100000 - 3090 epochs total Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0037 --- Epoch 643 / 100000 - 3091 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0146 Iteration 40, loss = 0.0168 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0064 --- Epoch 644 / 100000 - 3092 epochs total Iteration 0, loss = 0.0109 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0211 Iteration 80, loss = 0.0029 --- Epoch 645 / 100000 - 3093 epochs total Iteration 0, loss = 0.0115 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0257 --- Epoch 646 / 100000 - 3094 epochs total Iteration 0, loss = 0.0166 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0229 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0045 --- Epoch 647 / 100000 - 3095 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0328 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0135 Iteration 80, loss = 0.0089 --- Epoch 648 / 100000 - 3096 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0112 Iteration 60, loss 
= 0.0070 Iteration 80, loss = 0.0018 --- Epoch 649 / 100000 - 3097 epochs total Iteration 0, loss = 0.0279 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0031 --- Epoch 650 / 100000 - 3098 epochs total Iteration 0, loss = 0.0105 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0140 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0177 --- Epoch 651 / 100000 - 3099 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0035 --- Epoch 652 / 100000 - 3100 epochs total Iteration 0, loss = 0.0198 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0268 Iteration 80, loss = 0.0046 --- Epoch 653 / 100000 - 3101 epochs total Iteration 0, loss = 0.0090 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0208 Iteration 60, loss = 0.0158 Iteration 80, loss = 0.0047 --- Epoch 654 / 100000 - 3102 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0162 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0092 --- Epoch 655 / 100000 - 3103 epochs total Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0677 --- Epoch 656 / 100000 - 3104 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0528 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0031 --- Epoch 657 / 100000 - 3105 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0211 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0108 --- Epoch 658 / 100000 - 3106 epochs total Iteration 0, loss = 0.0214 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0040 --- Epoch 659 / 100000 - 3107 epochs total Iteration 0, loss = 0.0243 Iteration 20, loss = 0.0166 Iteration 40, loss = 0.0039 Iteration 60, 
loss = 0.0011 Iteration 80, loss = 0.0114 --- Epoch 660 / 100000 - 3108 epochs total Iteration 0, loss = 0.0300 Iteration 20, loss = 0.0082 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0070 --- Epoch 661 / 100000 - 3109 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0130 --- Epoch 662 / 100000 - 3110 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0140 --- Epoch 663 / 100000 - 3111 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0130 Iteration 80, loss = 0.0626 --- Epoch 664 / 100000 - 3112 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0265 Iteration 80, loss = 0.0130 --- Epoch 665 / 100000 - 3113 epochs total Iteration 0, loss = 0.0091 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0238 Iteration 60, loss = 0.0261 Iteration 80, loss = 0.0047 --- Epoch 666 / 100000 - 3114 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0303 Iteration 60, loss = 0.0108 Iteration 80, loss = 0.0022 --- Epoch 667 / 100000 - 3115 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0031 --- Epoch 668 / 100000 - 3116 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0008 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0305 --- Epoch 669 / 100000 - 3117 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0592 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0096 --- Epoch 670 / 100000 - 3118 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0146 Iteration 
60, loss = 0.0085 Iteration 80, loss = 0.0418 --- Epoch 671 / 100000 - 3119 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0170 Iteration 80, loss = 0.0064 --- Epoch 672 / 100000 - 3120 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0845 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0101 --- Epoch 673 / 100000 - 3121 epochs total Iteration 0, loss = 0.0222 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0177 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0050 --- Epoch 674 / 100000 - 3122 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0015 --- Epoch 675 / 100000 - 3123 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0392 --- Epoch 676 / 100000 - 3124 epochs total Iteration 0, loss = 0.0161 Iteration 20, loss = 0.0091 Iteration 40, loss = 0.0954 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0109 --- Epoch 677 / 100000 - 3125 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0070 --- Epoch 678 / 100000 - 3126 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0053 --- Epoch 679 / 100000 - 3127 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0160 Iteration 80, loss = 0.0053 --- Epoch 680 / 100000 - 3128 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0263 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0039 --- Epoch 681 / 100000 - 3129 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0036 
Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0043 --- Epoch 682 / 100000 - 3130 epochs total Iteration 0, loss = 0.0322 Iteration 20, loss = 0.0291 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0058 --- Epoch 683 / 100000 - 3131 epochs total Iteration 0, loss = 0.0233 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0340 Iteration 80, loss = 0.0078 --- Epoch 684 / 100000 - 3132 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0126 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0111 --- Epoch 685 / 100000 - 3133 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0177 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0094 --- Epoch 686 / 100000 - 3134 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0179 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0035 --- Epoch 687 / 100000 - 3135 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0030 --- Epoch 688 / 100000 - 3136 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0161 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0090 --- Epoch 689 / 100000 - 3137 epochs total Iteration 0, loss = 0.0594 Iteration 20, loss = 0.0210 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0013 --- Epoch 690 / 100000 - 3138 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0084 Iteration 60, loss = 0.0169 Iteration 80, loss = 0.0016 --- Epoch 691 / 100000 - 3139 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0078 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0416 Iteration 80, loss = 0.0084 --- Epoch 692 / 100000 - 3140 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0084 Iteration 40, loss = 
0.0419 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0056 --- Epoch 693 / 100000 - 3141 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0136 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0018 Iteration 80, loss = 0.0062 --- Epoch 694 / 100000 - 3142 epochs total Iteration 0, loss = 0.0133 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0340 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0018 --- Epoch 695 / 100000 - 3143 epochs total Iteration 0, loss = 0.0052 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0038 --- Epoch 696 / 100000 - 3144 epochs total Iteration 0, loss = 0.0018 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0136 Iteration 80, loss = 0.0090 --- Epoch 697 / 100000 - 3145 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0153 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0096 --- Epoch 698 / 100000 - 3146 epochs total Iteration 0, loss = 0.0082 Iteration 20, loss = 0.0154 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0239 Iteration 80, loss = 0.0087 --- Epoch 699 / 100000 - 3147 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0008 --- Epoch 700 / 100000 - 3148 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0170 Iteration 60, loss = 0.0229 Iteration 80, loss = 0.0188 --- Epoch 701 / 100000 - 3149 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0419 Iteration 80, loss = 0.0132 --- Epoch 702 / 100000 - 3150 epochs total Iteration 0, loss = 0.0221 Iteration 20, loss = 0.0199 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0115 --- Epoch 703 / 100000 - 3151 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0217 Iteration 40, loss 
= 0.0062 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0073 --- Epoch 704 / 100000 - 3152 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0009 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0139 --- Epoch 705 / 100000 - 3153 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0070 Iteration 80, loss = 0.0143 --- Epoch 706 / 100000 - 3154 epochs total Iteration 0, loss = 0.0437 Iteration 20, loss = 0.0064 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0039 --- Epoch 707 / 100000 - 3155 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0173 --- Epoch 708 / 100000 - 3156 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0153 Iteration 80, loss = 0.0134 --- Epoch 709 / 100000 - 3157 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0245 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0085 Iteration 80, loss = 0.0164 --- Epoch 710 / 100000 - 3158 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0239 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0027 --- Epoch 711 / 100000 - 3159 epochs total Iteration 0, loss = 0.0220 Iteration 20, loss = 0.0134 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0021 --- Epoch 712 / 100000 - 3160 epochs total Iteration 0, loss = 0.0256 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0068 --- Epoch 713 / 100000 - 3161 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0150 Iteration 40, loss = 0.0150 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0610 --- Epoch 714 / 100000 - 3162 epochs total Iteration 0, loss = 0.0100 Iteration 20, loss = 0.0036 Iteration 40, 
loss = 0.0082 Iteration 60, loss = 0.0137 Iteration 80, loss = 0.0086 --- Epoch 715 / 100000 - 3163 epochs total Iteration 0, loss = 0.0074 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0068 --- Epoch 716 / 100000 - 3164 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0185 Iteration 80, loss = 0.0039 --- Epoch 717 / 100000 - 3165 epochs total Iteration 0, loss = 0.0103 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0121 --- Epoch 718 / 100000 - 3166 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0196 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0017 --- Epoch 719 / 100000 - 3167 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0059 --- Epoch 720 / 100000 - 3168 epochs total Iteration 0, loss = 0.0624 Iteration 20, loss = 0.0036 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0071 --- Epoch 721 / 100000 - 3169 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0314 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0347 --- Epoch 722 / 100000 - 3170 epochs total Iteration 0, loss = 0.0101 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0143 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0017 --- Epoch 723 / 100000 - 3171 epochs total Iteration 0, loss = 0.0146 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0201 --- Epoch 724 / 100000 - 3172 epochs total Iteration 0, loss = 0.0092 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0090 --- Epoch 725 / 100000 - 3173 epochs total Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0204 Iteration 
40, loss = 0.0012 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0114 --- Epoch 726 / 100000 - 3174 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0072 Iteration 80, loss = 0.0087 --- Epoch 727 / 100000 - 3175 epochs total Iteration 0, loss = 0.0186 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0078 --- Epoch 728 / 100000 - 3176 epochs total Iteration 0, loss = 0.0214 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0082 Iteration 80, loss = 0.0090 --- Epoch 729 / 100000 - 3177 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0185 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0192 --- Epoch 730 / 100000 - 3178 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0161 Iteration 80, loss = 0.0457 --- Epoch 731 / 100000 - 3179 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0482 --- Epoch 732 / 100000 - 3180 epochs total Iteration 0, loss = 0.0095 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0024 --- Epoch 733 / 100000 - 3181 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0174 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0121 --- Epoch 734 / 100000 - 3182 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0049 --- Epoch 735 / 100000 - 3183 epochs total Iteration 0, loss = 0.0340 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0174 Iteration 80, loss = 0.0023 --- Epoch 736 / 100000 - 3184 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0256 
Iteration 40, loss = 0.0099 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0025 --- Epoch 737 / 100000 - 3185 epochs total Iteration 0, loss = 0.0372 Iteration 20, loss = 0.0137 Iteration 40, loss = 0.0152 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0051 --- Epoch 738 / 100000 - 3186 epochs total Iteration 0, loss = 0.0178 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0051 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0040 --- Epoch 739 / 100000 - 3187 epochs total Iteration 0, loss = 0.0494 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0240 Iteration 80, loss = 0.0037 --- Epoch 740 / 100000 - 3188 epochs total Iteration 0, loss = 0.0086 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0021 --- Epoch 741 / 100000 - 3189 epochs total Iteration 0, loss = 0.0265 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0087 --- Epoch 742 / 100000 - 3190 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0010 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0113 --- Epoch 743 / 100000 - 3191 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0045 --- Epoch 744 / 100000 - 3192 epochs total Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0103 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0166 --- Epoch 745 / 100000 - 3193 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0186 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0130 --- Epoch 746 / 100000 - 3194 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0031 --- Epoch 747 / 100000 - 3195 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 
0.0109 Iteration 40, loss = 0.0246 Iteration 60, loss = 0.0271 Iteration 80, loss = 0.0047 --- Epoch 748 / 100000 - 3196 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0089 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0064 Iteration 80, loss = 0.0019 --- Epoch 749 / 100000 - 3197 epochs total Iteration 0, loss = 0.0039 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0073 Iteration 80, loss = 0.0351 --- Epoch 750 / 100000 - 3198 epochs total Iteration 0, loss = 0.0296 Iteration 20, loss = 0.0365 Iteration 40, loss = 0.0226 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0044 --- Epoch 751 / 100000 - 3199 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0119 --- Epoch 752 / 100000 - 3200 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0081 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0024 --- Epoch 753 / 100000 - 3201 epochs total Iteration 0, loss = 0.0197 Iteration 20, loss = 0.0225 Iteration 40, loss = 0.0135 Iteration 60, loss = 0.0197 Iteration 80, loss = 0.0064 --- Epoch 754 / 100000 - 3202 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0090 --- Epoch 755 / 100000 - 3203 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0231 Iteration 60, loss = 0.0062 Iteration 80, loss = 0.0026 --- Epoch 756 / 100000 - 3204 epochs total Iteration 0, loss = 0.0011 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0013 --- Epoch 757 / 100000 - 3205 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0267 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0079 --- Epoch 758 / 100000 - 3206 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss 
= 0.0100 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0081 --- Epoch 759 / 100000 - 3207 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0157 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0055 --- Epoch 760 / 100000 - 3208 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0276 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0098 --- Epoch 761 / 100000 - 3209 epochs total Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0072 --- Epoch 762 / 100000 - 3210 epochs total Iteration 0, loss = 0.0132 Iteration 20, loss = 0.0199 Iteration 40, loss = 0.0230 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0130 --- Epoch 763 / 100000 - 3211 epochs total Iteration 0, loss = 0.0190 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0676 Iteration 80, loss = 0.0034 --- Epoch 764 / 100000 - 3212 epochs total Iteration 0, loss = 0.0151 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0022 --- Epoch 765 / 100000 - 3213 epochs total Iteration 0, loss = 0.0121 Iteration 20, loss = 0.0086 Iteration 40, loss = 0.0066 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0033 --- Epoch 766 / 100000 - 3214 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0248 Iteration 40, loss = 0.0630 Iteration 60, loss = 0.0098 Iteration 80, loss = 0.0032 --- Epoch 767 / 100000 - 3215 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0250 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0056 --- Epoch 768 / 100000 - 3216 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0377 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0108 --- Epoch 769 / 100000 - 3217 epochs total Iteration 0, loss = 0.0383 Iteration 20, 
loss = 0.0061 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0073 --- Epoch 770 / 100000 - 3218 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0041 Iteration 80, loss = 0.0261 --- Epoch 771 / 100000 - 3219 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0153 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0069 --- Epoch 772 / 100000 - 3220 epochs total Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0342 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0064 --- Epoch 773 / 100000 - 3221 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0103 --- Epoch 774 / 100000 - 3222 epochs total Iteration 0, loss = 0.0072 Iteration 20, loss = 0.0095 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0022 --- Epoch 775 / 100000 - 3223 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0218 Iteration 40, loss = 0.0312 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0101 --- Epoch 776 / 100000 - 3224 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0015 Iteration 80, loss = 0.0040 --- Epoch 777 / 100000 - 3225 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0084 --- Epoch 778 / 100000 - 3226 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0150 Iteration 80, loss = 0.0026 --- Epoch 779 / 100000 - 3227 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0032 --- Epoch 780 / 100000 - 3228 epochs total Iteration 0, loss = 0.0042 Iteration 
20, loss = 0.0081 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0025 --- Epoch 781 / 100000 - 3229 epochs total Iteration 0, loss = 0.0111 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0200 Iteration 60, loss = 0.0202 Iteration 80, loss = 0.0018 --- Epoch 782 / 100000 - 3230 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0195 Iteration 80, loss = 0.0093 --- Epoch 783 / 100000 - 3231 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0084 --- Epoch 784 / 100000 - 3232 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0128 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0026 --- Epoch 785 / 100000 - 3233 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0177 --- Epoch 786 / 100000 - 3234 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0050 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0466 --- Epoch 787 / 100000 - 3235 epochs total Iteration 0, loss = 0.0223 Iteration 20, loss = 0.0303 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0385 Iteration 80, loss = 0.0141 --- Epoch 788 / 100000 - 3236 epochs total Iteration 0, loss = 0.0194 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0128 Iteration 80, loss = 0.0038 --- Epoch 789 / 100000 - 3237 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0133 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0113 --- Epoch 790 / 100000 - 3238 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0179 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0183 --- Epoch 791 / 100000 - 3239 epochs total Iteration 0, loss = 0.0201 
Iteration 20, loss = 0.0097 Iteration 40, loss = 0.0224 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0087 --- Epoch 792 / 100000 - 3240 epochs total Iteration 0, loss = 0.0164 Iteration 20, loss = 0.0165 Iteration 40, loss = 0.0088 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0359 --- Epoch 793 / 100000 - 3241 epochs total Iteration 0, loss = 0.0156 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0139 Iteration 80, loss = 0.0099 --- Epoch 794 / 100000 - 3242 epochs total Iteration 0, loss = 0.0294 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0103 Iteration 80, loss = 0.0168 --- Epoch 795 / 100000 - 3243 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0233 Iteration 80, loss = 0.0098 --- Epoch 796 / 100000 - 3244 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0159 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0190 Iteration 80, loss = 0.0063 --- Epoch 797 / 100000 - 3245 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0179 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0222 --- Epoch 798 / 100000 - 3246 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0009 Iteration 80, loss = 0.0104 --- Epoch 799 / 100000 - 3247 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0027 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0157 --- Epoch 800 / 100000 - 3248 epochs total Iteration 0, loss = 0.0122 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0204 Iteration 80, loss = 0.0091 --- Epoch 801 / 100000 - 3249 epochs total Iteration 0, loss = 0.0330 Iteration 20, loss = 0.0108 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0139 --- Epoch 802 / 100000 - 3250 epochs total Iteration 0, loss = 
0.0104 Iteration 20, loss = 0.0240 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0148 --- Epoch 803 / 100000 - 3251 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0184 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0171 --- Epoch 804 / 100000 - 3252 epochs total Iteration 0, loss = 0.0264 Iteration 20, loss = 0.0424 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0163 --- Epoch 805 / 100000 - 3253 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0167 --- Epoch 806 / 100000 - 3254 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0059 Iteration 60, loss = 0.0091 Iteration 80, loss = 0.0208 --- Epoch 807 / 100000 - 3255 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0217 Iteration 40, loss = 0.0172 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0170 --- Epoch 808 / 100000 - 3256 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0171 Iteration 40, loss = 0.0225 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0045 --- Epoch 809 / 100000 - 3257 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0100 --- Epoch 810 / 100000 - 3258 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0053 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0062 --- Epoch 811 / 100000 - 3259 epochs total Iteration 0, loss = 0.0033 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0120 --- Epoch 812 / 100000 - 3260 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0181 Iteration 40, loss = 0.0505 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0384 --- Epoch 813 / 100000 - 3261 epochs total Iteration 0, loss 
= 0.0203 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0037 Iteration 80, loss = 0.0247 --- Epoch 814 / 100000 - 3262 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0031 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0200 --- Epoch 815 / 100000 - 3263 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0047 --- Epoch 816 / 100000 - 3264 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0195 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0100 --- Epoch 817 / 100000 - 3265 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0044 --- Epoch 818 / 100000 - 3266 epochs total Iteration 0, loss = 0.0094 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0106 --- Epoch 819 / 100000 - 3267 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0096 Iteration 80, loss = 0.0017 --- Epoch 820 / 100000 - 3268 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0176 Iteration 80, loss = 0.0157 --- Epoch 821 / 100000 - 3269 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0436 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0084 --- Epoch 822 / 100000 - 3270 epochs total Iteration 0, loss = 0.0040 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0030 --- Epoch 823 / 100000 - 3271 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0013 Iteration 40, loss = 0.0228 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0101 --- Epoch 824 / 100000 - 3272 epochs total Iteration 0, 
loss = 0.0039 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0582 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0585 --- Epoch 825 / 100000 - 3273 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0259 Iteration 60, loss = 0.0119 Iteration 80, loss = 0.0052 --- Epoch 826 / 100000 - 3274 epochs total Iteration 0, loss = 0.0075 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0075 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0035 --- Epoch 827 / 100000 - 3275 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0219 Iteration 40, loss = 0.0182 Iteration 60, loss = 0.0286 Iteration 80, loss = 0.0753 --- Epoch 828 / 100000 - 3276 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0089 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0030 --- Epoch 829 / 100000 - 3277 epochs total Iteration 0, loss = 0.0225 Iteration 20, loss = 0.0361 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0057 Iteration 80, loss = 0.0039 --- Epoch 830 / 100000 - 3278 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0175 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0301 --- Epoch 831 / 100000 - 3279 epochs total Iteration 0, loss = 0.0426 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0025 Iteration 80, loss = 0.0173 --- Epoch 832 / 100000 - 3280 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0187 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0048 --- Epoch 833 / 100000 - 3281 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0313 Iteration 80, loss = 0.0061 --- Epoch 834 / 100000 - 3282 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0056 Iteration 80, loss = 0.0078 --- Epoch 835 / 100000 - 3283 epochs total Iteration 
0, loss = 0.0039 Iteration 20, loss = 0.0216 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0043 Iteration 80, loss = 0.0041 --- Epoch 836 / 100000 - 3284 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0077 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0317 Iteration 80, loss = 0.0047 --- Epoch 837 / 100000 - 3285 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0148 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0135 --- Epoch 838 / 100000 - 3286 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0177 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0106 --- Epoch 839 / 100000 - 3287 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0087 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0093 Iteration 80, loss = 0.0053 --- Epoch 840 / 100000 - 3288 epochs total Iteration 0, loss = 0.0208 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0077 Iteration 60, loss = 0.0156 Iteration 80, loss = 0.0049 --- Epoch 841 / 100000 - 3289 epochs total Iteration 0, loss = 0.0499 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0081 --- Epoch 842 / 100000 - 3290 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0256 Iteration 60, loss = 0.0106 Iteration 80, loss = 0.0056 --- Epoch 843 / 100000 - 3291 epochs total Iteration 0, loss = 0.0088 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0036 Iteration 60, loss = 0.0028 Iteration 80, loss = 0.0433 --- Epoch 844 / 100000 - 3292 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0527 Iteration 40, loss = 0.0076 Iteration 60, loss = 0.0084 Iteration 80, loss = 0.0156 --- Epoch 845 / 100000 - 3293 epochs total Iteration 0, loss = 0.0344 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0023 --- Epoch 846 / 100000 - 3294 epochs total 
Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0229 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0315 Iteration 80, loss = 0.0350 --- Epoch 847 / 100000 - 3295 epochs total Iteration 0, loss = 0.0049 Iteration 20, loss = 0.0044 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0061 --- Epoch 848 / 100000 - 3296 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0196 Iteration 40, loss = 0.0070 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0050 --- Epoch 849 / 100000 - 3297 epochs total Iteration 0, loss = 0.0046 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0014 --- Epoch 850 / 100000 - 3298 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0121 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0092 --- Epoch 851 / 100000 - 3299 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0074 Iteration 40, loss = 0.0047 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0041 --- Epoch 852 / 100000 - 3300 epochs total Iteration 0, loss = 0.0108 Iteration 20, loss = 0.0152 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0079 Iteration 80, loss = 0.0062 --- Epoch 853 / 100000 - 3301 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0112 Iteration 60, loss = 0.0455 Iteration 80, loss = 0.0024 --- Epoch 854 / 100000 - 3302 epochs total Iteration 0, loss = 0.0112 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0255 Iteration 80, loss = 0.0051 --- Epoch 855 / 100000 - 3303 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0057 --- Epoch 856 / 100000 - 3304 epochs total Iteration 0, loss = 0.0722 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0095 Iteration 80, loss = 0.0050 --- Epoch 857 / 100000 - 3305 epochs 
total Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0309 --- Epoch 858 / 100000 - 3306 epochs total Iteration 0, loss = 0.0022 Iteration 20, loss = 0.0079 Iteration 40, loss = 0.0045 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0082 --- Epoch 859 / 100000 - 3307 epochs total Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0020 --- Epoch 860 / 100000 - 3308 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0033 Iteration 40, loss = 0.0266 Iteration 60, loss = 0.0390 Iteration 80, loss = 0.0225 --- Epoch 861 / 100000 - 3309 epochs total Iteration 0, loss = 0.0098 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0112 --- Epoch 862 / 100000 - 3310 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0107 Iteration 80, loss = 0.0064 --- Epoch 863 / 100000 - 3311 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0286 Iteration 40, loss = 0.0132 Iteration 60, loss = 0.0241 Iteration 80, loss = 0.0191 --- Epoch 864 / 100000 - 3312 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0156 --- Epoch 865 / 100000 - 3313 epochs total Iteration 0, loss = 0.0125 Iteration 20, loss = 0.0099 Iteration 40, loss = 0.0017 Iteration 60, loss = 0.0017 Iteration 80, loss = 0.0012 --- Epoch 866 / 100000 - 3314 epochs total Iteration 0, loss = 0.0116 Iteration 20, loss = 0.0121 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0045 --- Epoch 867 / 100000 - 3315 epochs total Iteration 0, loss = 0.0176 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0375 Iteration 60, loss = 0.0189 Iteration 80, loss = 0.0081 --- Epoch 868 / 100000 - 3316 
epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0144 --- Epoch 869 / 100000 - 3317 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0154 Iteration 80, loss = 0.0031 --- Epoch 870 / 100000 - 3318 epochs total Iteration 0, loss = 0.0079 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0082 Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0081 --- Epoch 871 / 100000 - 3319 epochs total Iteration 0, loss = 0.0236 Iteration 20, loss = 0.0035 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0295 Iteration 80, loss = 0.0060 --- Epoch 872 / 100000 - 3320 epochs total Iteration 0, loss = 0.0210 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0144 --- Epoch 873 / 100000 - 3321 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0019 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0022 --- Epoch 874 / 100000 - 3322 epochs total Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0067 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0027 --- Epoch 875 / 100000 - 3323 epochs total Iteration 0, loss = 0.0107 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0388 Iteration 60, loss = 0.0051 Iteration 80, loss = 0.0019 --- Epoch 876 / 100000 - 3324 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0431 --- Epoch 877 / 100000 - 3325 epochs total Iteration 0, loss = 0.0020 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0193 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0011 --- Epoch 878 / 100000 - 3326 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0071 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0507 Iteration 80, loss = 0.0072 --- Epoch 879 / 100000 - 
3327 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0113 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0168 --- Epoch 880 / 100000 - 3328 epochs total Iteration 0, loss = 0.0084 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0024 --- Epoch 881 / 100000 - 3329 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0056 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0080 --- Epoch 882 / 100000 - 3330 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0231 Iteration 80, loss = 0.0049 --- Epoch 883 / 100000 - 3331 epochs total Iteration 0, loss = 0.0265 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0012 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0033 --- Epoch 884 / 100000 - 3332 epochs total Iteration 0, loss = 0.0061 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0151 Iteration 80, loss = 0.0031 --- Epoch 885 / 100000 - 3333 epochs total Iteration 0, loss = 0.0089 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0023 Iteration 60, loss = 0.0149 Iteration 80, loss = 0.0098 --- Epoch 886 / 100000 - 3334 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0096 --- Epoch 887 / 100000 - 3335 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0102 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0101 --- Epoch 888 / 100000 - 3336 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0139 Iteration 40, loss = 0.0222 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0123 --- Epoch 889 / 100000 - 3337 epochs total Iteration 0, loss = 0.0164 Iteration 20, loss = 0.0308 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0044 Iteration 80, loss = 0.0042 --- Epoch 890 / 100000 
- 3338 epochs total Iteration 0, loss = 0.0047 Iteration 20, loss = 0.0206 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0104 Iteration 80, loss = 0.0101 --- Epoch 891 / 100000 - 3339 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0124 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0115 --- Epoch 892 / 100000 - 3340 epochs total Iteration 0, loss = 0.0019 Iteration 20, loss = 0.0115 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0137 --- Epoch 893 / 100000 - 3341 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0025 --- Epoch 894 / 100000 - 3342 epochs total Iteration 0, loss = 0.0056 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0105 Iteration 80, loss = 0.0010 --- Epoch 895 / 100000 - 3343 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0580 --- Epoch 896 / 100000 - 3344 epochs total Iteration 0, loss = 0.0135 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0492 Iteration 60, loss = 0.0134 Iteration 80, loss = 0.0056 --- Epoch 897 / 100000 - 3345 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0028 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0234 Iteration 80, loss = 0.0238 --- Epoch 898 / 100000 - 3346 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0076 Iteration 40, loss = 0.0026 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0036 --- Epoch 899 / 100000 - 3347 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0066 --- Epoch 900 / 100000 - 3348 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0012 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0029 Iteration 80, loss = 0.0024 --- Epoch 901 / 
100000 - 3349 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0188 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0066 --- Epoch 902 / 100000 - 3350 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0042 --- Epoch 903 / 100000 - 3351 epochs total Iteration 0, loss = 0.0141 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0061 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0025 --- Epoch 904 / 100000 - 3352 epochs total Iteration 0, loss = 0.0153 Iteration 20, loss = 0.0147 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0108 --- Epoch 905 / 100000 - 3353 epochs total Iteration 0, loss = 0.0023 Iteration 20, loss = 0.0268 Iteration 40, loss = 0.0025 Iteration 60, loss = 0.0081 Iteration 80, loss = 0.0133 --- Epoch 906 / 100000 - 3354 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0066 Iteration 40, loss = 0.0106 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0032 --- Epoch 907 / 100000 - 3355 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0068 Iteration 80, loss = 0.0024 --- Epoch 908 / 100000 - 3356 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0722 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0017 --- Epoch 909 / 100000 - 3357 epochs total Iteration 0, loss = 0.0586 Iteration 20, loss = 0.0081 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0189 --- Epoch 910 / 100000 - 3358 epochs total Iteration 0, loss = 0.0128 Iteration 20, loss = 0.0128 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0053 Iteration 80, loss = 0.0051 --- Epoch 911 / 100000 - 3359 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0075 Iteration 40, loss = 0.0292 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0042 --- Epoch 912 
/ 100000 - 3360 epochs total Iteration 0, loss = 0.0015 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0369 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0075 --- Epoch 913 / 100000 - 3361 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0159 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0023 --- Epoch 914 / 100000 - 3362 epochs total Iteration 0, loss = 0.0053 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0168 Iteration 80, loss = 0.0040 --- Epoch 915 / 100000 - 3363 epochs total Iteration 0, loss = 0.0036 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0058 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0120 --- Epoch 916 / 100000 - 3364 epochs total Iteration 0, loss = 0.0204 Iteration 20, loss = 0.0183 Iteration 40, loss = 0.0087 Iteration 60, loss = 0.0100 Iteration 80, loss = 0.0230 --- Epoch 917 / 100000 - 3365 epochs total Iteration 0, loss = 0.0054 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0351 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0162 --- Epoch 918 / 100000 - 3366 epochs total Iteration 0, loss = 0.0225 Iteration 20, loss = 0.0113 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0189 Iteration 80, loss = 0.0012 --- Epoch 919 / 100000 - 3367 epochs total Iteration 0, loss = 0.0070 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0260 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0083 --- Epoch 920 / 100000 - 3368 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0052 --- Epoch 921 / 100000 - 3369 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0226 Iteration 40, loss = 0.0097 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0043 --- Epoch 922 / 100000 - 3370 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0290 Iteration 80, loss = 0.0141 --- Epoch 
923 / 100000 - 3371 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0149 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0043 --- Epoch 924 / 100000 - 3372 epochs total Iteration 0, loss = 0.0038 Iteration 20, loss = 0.0195 Iteration 40, loss = 0.0241 Iteration 60, loss = 0.0026 Iteration 80, loss = 0.0073 --- Epoch 925 / 100000 - 3373 epochs total Iteration 0, loss = 0.0192 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0670 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0041 --- Epoch 926 / 100000 - 3374 epochs total Iteration 0, loss = 0.0275 Iteration 20, loss = 0.0114 Iteration 40, loss = 0.0824 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0384 --- Epoch 927 / 100000 - 3375 epochs total Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0186 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0014 Iteration 80, loss = 0.0072 --- Epoch 928 / 100000 - 3376 epochs total Iteration 0, loss = 0.0081 Iteration 20, loss = 0.0026 Iteration 40, loss = 0.0103 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0116 --- Epoch 929 / 100000 - 3377 epochs total Iteration 0, loss = 0.0093 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0062 --- Epoch 930 / 100000 - 3378 epochs total Iteration 0, loss = 0.0126 Iteration 20, loss = 0.0322 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0071 Iteration 80, loss = 0.0015 --- Epoch 931 / 100000 - 3379 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0070 Iteration 40, loss = 0.0018 Iteration 60, loss = 0.0078 Iteration 80, loss = 0.0069 --- Epoch 932 / 100000 - 3380 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0206 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0016 Iteration 80, loss = 0.0054 --- Epoch 933 / 100000 - 3381 epochs total Iteration 0, loss = 0.0143 Iteration 20, loss = 0.0348 Iteration 40, loss = 0.0083 Iteration 60, loss = 0.0066 Iteration 80, loss = 0.0087 --- 
Epoch 934 / 100000 - 3382 epochs total Iteration 0, loss = 0.0258 Iteration 20, loss = 0.0027 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0182 Iteration 80, loss = 0.0035 --- Epoch 935 / 100000 - 3383 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0111 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0045 Iteration 80, loss = 0.0045 --- Epoch 936 / 100000 - 3384 epochs total Iteration 0, loss = 0.0138 Iteration 20, loss = 0.0062 Iteration 40, loss = 0.0016 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0618 --- Epoch 937 / 100000 - 3385 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0054 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0152 Iteration 80, loss = 0.0069 --- Epoch 938 / 100000 - 3386 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0167 Iteration 60, loss = 0.0118 Iteration 80, loss = 0.0097 --- Epoch 939 / 100000 - 3387 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0034 Iteration 40, loss = 0.0211 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0073 --- Epoch 940 / 100000 - 3388 epochs total Iteration 0, loss = 0.0106 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0044 Iteration 60, loss = 0.0059 Iteration 80, loss = 0.0136 --- Epoch 941 / 100000 - 3389 epochs total Iteration 0, loss = 0.0402 Iteration 20, loss = 0.0063 Iteration 40, loss = 0.0130 Iteration 60, loss = 0.0012 Iteration 80, loss = 0.0038 --- Epoch 942 / 100000 - 3390 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0118 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0074 Iteration 80, loss = 0.0030 --- Epoch 943 / 100000 - 3391 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0041 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0040 --- Epoch 944 / 100000 - 3392 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0180 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0046 
--- Epoch 945 / 100000 - 3393 epochs total Iteration 0, loss = 0.0360 Iteration 20, loss = 0.0153 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0011 Iteration 80, loss = 0.0123 --- Epoch 946 / 100000 - 3394 epochs total Iteration 0, loss = 0.0821 Iteration 20, loss = 0.0014 Iteration 40, loss = 0.0105 Iteration 60, loss = 0.0087 Iteration 80, loss = 0.0065 --- Epoch 947 / 100000 - 3395 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0194 Iteration 40, loss = 0.0124 Iteration 60, loss = 0.0058 Iteration 80, loss = 0.0098 --- Epoch 948 / 100000 - 3396 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0271 Iteration 80, loss = 0.0117 --- Epoch 949 / 100000 - 3397 epochs total Iteration 0, loss = 0.0057 Iteration 20, loss = 0.0029 Iteration 40, loss = 0.0096 Iteration 60, loss = 0.0148 Iteration 80, loss = 0.0070 --- Epoch 950 / 100000 - 3398 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0111 Iteration 60, loss = 0.0024 Iteration 80, loss = 0.0014 --- Epoch 951 / 100000 - 3399 epochs total Iteration 0, loss = 0.0139 Iteration 20, loss = 0.0022 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0121 --- Epoch 952 / 100000 - 3400 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0228 Iteration 60, loss = 0.0214 Iteration 80, loss = 0.0119 --- Epoch 953 / 100000 - 3401 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0041 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0022 --- Epoch 954 / 100000 - 3402 epochs total Iteration 0, loss = 0.0016 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0020 Iteration 60, loss = 0.0063 Iteration 80, loss = 0.0151 --- Epoch 955 / 100000 - 3403 epochs total Iteration 0, loss = 0.0188 Iteration 20, loss = 0.0105 Iteration 40, loss = 0.0068 Iteration 60, loss = 0.0060 Iteration 80, loss = 
0.0147 --- Epoch 956 / 100000 - 3404 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0101 Iteration 60, loss = 0.0140 Iteration 80, loss = 0.0068 --- Epoch 957 / 100000 - 3405 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0036 Iteration 80, loss = 0.0272 --- Epoch 958 / 100000 - 3406 epochs total Iteration 0, loss = 0.0067 Iteration 20, loss = 0.0313 Iteration 40, loss = 0.0371 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0048 --- Epoch 959 / 100000 - 3407 epochs total Iteration 0, loss = 0.0042 Iteration 20, loss = 0.0015 Iteration 40, loss = 0.0063 Iteration 60, loss = 0.0198 Iteration 80, loss = 0.0053 --- Epoch 960 / 100000 - 3408 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0069 Iteration 40, loss = 0.0039 Iteration 60, loss = 0.0020 Iteration 80, loss = 0.0040 --- Epoch 961 / 100000 - 3409 epochs total Iteration 0, loss = 0.0055 Iteration 20, loss = 0.0148 Iteration 40, loss = 0.0098 Iteration 60, loss = 0.0030 Iteration 80, loss = 0.0037 --- Epoch 962 / 100000 - 3410 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0141 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0059 --- Epoch 963 / 100000 - 3411 epochs total Iteration 0, loss = 0.0027 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0061 Iteration 80, loss = 0.0228 --- Epoch 964 / 100000 - 3412 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0021 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0270 Iteration 80, loss = 0.0102 --- Epoch 965 / 100000 - 3413 epochs total Iteration 0, loss = 0.0060 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0054 Iteration 80, loss = 0.0119 --- Epoch 966 / 100000 - 3414 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0107 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0052 Iteration 80, loss 
= 0.0088 --- Epoch 967 / 100000 - 3415 epochs total Iteration 0, loss = 0.0324 Iteration 20, loss = 0.0040 Iteration 40, loss = 0.0565 Iteration 60, loss = 0.0069 Iteration 80, loss = 0.0097 --- Epoch 968 / 100000 - 3416 epochs total Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0024 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0172 Iteration 80, loss = 0.0362 --- Epoch 969 / 100000 - 3417 epochs total Iteration 0, loss = 0.0119 Iteration 20, loss = 0.0059 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0035 --- Epoch 970 / 100000 - 3418 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0178 Iteration 40, loss = 0.0035 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0076 --- Epoch 971 / 100000 - 3419 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0042 Iteration 40, loss = 0.0079 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0056 --- Epoch 972 / 100000 - 3420 epochs total Iteration 0, loss = 0.0127 Iteration 20, loss = 0.0116 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0147 Iteration 80, loss = 0.0207 --- Epoch 973 / 100000 - 3421 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0046 Iteration 40, loss = 0.0049 Iteration 60, loss = 0.0080 Iteration 80, loss = 0.0021 --- Epoch 974 / 100000 - 3422 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0058 Iteration 40, loss = 0.0029 Iteration 60, loss = 0.0023 Iteration 80, loss = 0.0083 --- Epoch 975 / 100000 - 3423 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0053 Iteration 40, loss = 0.0009 Iteration 60, loss = 0.0264 Iteration 80, loss = 0.0042 --- Epoch 976 / 100000 - 3424 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0078 Iteration 60, loss = 0.0133 Iteration 80, loss = 0.0088 --- Epoch 977 / 100000 - 3425 epochs total Iteration 0, loss = 0.0073 Iteration 20, loss = 0.0299 Iteration 40, loss = 0.0142 Iteration 60, loss = 0.0060 Iteration 80, 
loss = 0.0108 --- Epoch 978 / 100000 - 3426 epochs total Iteration 0, loss = 0.0028 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0207 Iteration 80, loss = 0.0235 --- Epoch 979 / 100000 - 3427 epochs total Iteration 0, loss = 0.0170 Iteration 20, loss = 0.0057 Iteration 40, loss = 0.0416 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0027 --- Epoch 980 / 100000 - 3428 epochs total Iteration 0, loss = 0.0021 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0238 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0067 --- Epoch 981 / 100000 - 3429 epochs total Iteration 0, loss = 0.0123 Iteration 20, loss = 0.0247 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0102 Iteration 80, loss = 0.0089 --- Epoch 982 / 100000 - 3430 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0028 Iteration 60, loss = 0.0281 Iteration 80, loss = 0.0031 --- Epoch 983 / 100000 - 3431 epochs total Iteration 0, loss = 0.0010 Iteration 20, loss = 0.0101 Iteration 40, loss = 0.0086 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0149 --- Epoch 984 / 100000 - 3432 epochs total Iteration 0, loss = 0.0044 Iteration 20, loss = 0.0106 Iteration 40, loss = 0.0030 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0116 --- Epoch 985 / 100000 - 3433 epochs total Iteration 0, loss = 0.0187 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0108 Iteration 60, loss = 0.0345 Iteration 80, loss = 0.0039 --- Epoch 986 / 100000 - 3434 epochs total Iteration 0, loss = 0.0026 Iteration 20, loss = 0.0164 Iteration 40, loss = 0.0092 Iteration 60, loss = 0.0180 Iteration 80, loss = 0.0123 --- Epoch 987 / 100000 - 3435 epochs total Iteration 0, loss = 0.0187 Iteration 20, loss = 0.0055 Iteration 40, loss = 0.0032 Iteration 60, loss = 0.0097 Iteration 80, loss = 0.0321 --- Epoch 988 / 100000 - 3436 epochs total Iteration 0, loss = 0.0096 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0083 Iteration 
80, loss = 0.0054 --- Epoch 989 / 100000 - 3437 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0973 --- Epoch 990 / 100000 - 3438 epochs total Iteration 0, loss = 0.0213 Iteration 20, loss = 0.0088 Iteration 40, loss = 0.0022 Iteration 60, loss = 0.0240 Iteration 80, loss = 0.0207 --- Epoch 991 / 100000 - 3439 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0034 Iteration 60, loss = 0.0048 Iteration 80, loss = 0.0045 --- Epoch 992 / 100000 - 3440 epochs total Iteration 0, loss = 0.0050 Iteration 20, loss = 0.0068 Iteration 40, loss = 0.0197 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0062 --- Epoch 993 / 100000 - 3441 epochs total Iteration 0, loss = 0.0249 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0129 Iteration 60, loss = 0.0065 Iteration 80, loss = 0.0192 --- Epoch 994 / 100000 - 3442 epochs total Iteration 0, loss = 0.0030 Iteration 20, loss = 0.0100 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0039 --- Epoch 995 / 100000 - 3443 epochs total Iteration 0, loss = 0.0058 Iteration 20, loss = 0.0080 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0162 Iteration 80, loss = 0.0034 --- Epoch 996 / 100000 - 3444 epochs total Iteration 0, loss = 0.0065 Iteration 20, loss = 0.0189 Iteration 40, loss = 0.0069 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0068 --- Epoch 997 / 100000 - 3445 epochs total Iteration 0, loss = 0.0124 Iteration 20, loss = 0.0010 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0063 --- Epoch 998 / 100000 - 3446 epochs total Iteration 0, loss = 0.0416 Iteration 20, loss = 0.0546 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0077 Iteration 80, loss = 0.0558 --- Epoch 999 / 100000 - 3447 epochs total Iteration 0, loss = 0.0012 Iteration 20, loss = 0.0353 Iteration 40, loss = 0.0040 Iteration 60, loss = 0.0052 
Iteration 80, loss = 0.0123 --- Epoch 1000 / 100000 - 3448 epochs total Iteration 0, loss = 0.0066 Iteration 20, loss = 0.0052 Iteration 40, loss = 0.0056 Iteration 60, loss = 0.0141 Iteration 80, loss = 0.0046 --- Epoch 1001 / 100000 - 3449 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0096 Iteration 40, loss = 0.0118 Iteration 60, loss = 0.0295 Iteration 80, loss = 0.0140 --- Epoch 1002 / 100000 - 3450 epochs total Iteration 0, loss = 0.0446 Iteration 20, loss = 0.0032 Iteration 40, loss = 0.0062 Iteration 60, loss = 0.0019 Iteration 80, loss = 0.0172 --- Epoch 1003 / 100000 - 3451 epochs total Iteration 0, loss = 0.0024 Iteration 20, loss = 0.0018 Iteration 40, loss = 0.0013 Iteration 60, loss = 0.0083 Iteration 80, loss = 0.0054 --- Epoch 1004 / 100000 - 3452 epochs total Iteration 0, loss = 0.0029 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0033 Iteration 60, loss = 0.0033 Iteration 80, loss = 0.0150 --- Epoch 1005 / 100000 - 3453 epochs total Iteration 0, loss = 0.0037 Iteration 20, loss = 0.0135 Iteration 40, loss = 0.0160 Iteration 60, loss = 0.0039 Iteration 80, loss = 0.0054 --- Epoch 1006 / 100000 - 3454 epochs total Iteration 0, loss = 0.0017 Iteration 20, loss = 0.0017 Iteration 40, loss = 0.0067 Iteration 60, loss = 0.0042 Iteration 80, loss = 0.0112 --- Epoch 1007 / 100000 - 3455 epochs total Iteration 0, loss = 0.0113 Iteration 20, loss = 0.0466 Iteration 40, loss = 0.0091 Iteration 60, loss = 0.0047 Iteration 80, loss = 0.0131 --- Epoch 1008 / 100000 - 3456 epochs total Iteration 0, loss = 0.0110 Iteration 20, loss = 0.0072 Iteration 40, loss = 0.0107 Iteration 60, loss = 0.0129 Iteration 80, loss = 0.0067 --- Epoch 1009 / 100000 - 3457 epochs total Iteration 0, loss = 0.0085 Iteration 20, loss = 0.0019 Iteration 40, loss = 0.0178 Iteration 60, loss = 0.0101 Iteration 80, loss = 0.0169 --- Epoch 1010 / 100000 - 3458 epochs total Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0125 Iteration 40, loss = 0.0065 Iteration 60, 
loss = 0.0058 Iteration 80, loss = 0.0063 --- Epoch 1011 / 100000 - 3459 epochs total Iteration 0, loss = 0.0129 Iteration 20, loss = 0.0016 Iteration 40, loss = 0.0054 Iteration 60, loss = 0.0027 Iteration 80, loss = 0.0082 --- Epoch 1012 / 100000 - 3460 epochs total Iteration 0, loss = 0.0041 Iteration 20, loss = 0.0037 Iteration 40, loss = 0.0072 Iteration 60, loss = 0.0132 Iteration 80, loss = 0.0255 --- Epoch 1013 / 100000 - 3461 epochs total Iteration 0, loss = 0.0214 Iteration 20, loss = 0.0045 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0090 Iteration 80, loss = 0.0095 --- Epoch 1014 / 100000 - 3462 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0130 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0142 Iteration 80, loss = 0.0050 --- Epoch 1015 / 100000 - 3463 epochs total Iteration 0, loss = 0.0064 Iteration 20, loss = 0.0085 Iteration 40, loss = 0.0115 Iteration 60, loss = 0.0060 Iteration 80, loss = 0.0077 --- Epoch 1016 / 100000 - 3464 epochs total Iteration 0, loss = 0.0034 Iteration 20, loss = 0.0281 Iteration 40, loss = 0.0055 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0027 --- Epoch 1017 / 100000 - 3465 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0100 Iteration 60, loss = 0.0124 Iteration 80, loss = 0.0250 --- Epoch 1018 / 100000 - 3466 epochs total Iteration 0, loss = 0.0032 Iteration 20, loss = 0.0038 Iteration 40, loss = 0.0110 Iteration 60, loss = 0.0127 Iteration 80, loss = 0.0160 --- Epoch 1019 / 100000 - 3467 epochs total Iteration 0, loss = 0.0102 Iteration 20, loss = 0.0061 Iteration 40, loss = 0.0043 Iteration 60, loss = 0.0177 Iteration 80, loss = 0.0135 --- Epoch 1020 / 100000 - 3468 epochs total Iteration 0, loss = 0.0148 Iteration 20, loss = 0.0060 Iteration 40, loss = 0.0204 Iteration 60, loss = 0.0179 Iteration 80, loss = 0.0055 --- Epoch 1021 / 100000 - 3469 epochs total Iteration 0, loss = 0.0059 Iteration 20, loss = 0.0030 Iteration 40, loss = 0.0093 
Iteration 60, loss = 0.0032 Iteration 80, loss = 0.0046 --- Epoch 1022 / 100000 - 3470 epochs total Iteration 0, loss = 0.0199 Iteration 20, loss = 0.0025 Iteration 40, loss = 0.0042 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0054 --- Epoch 1023 / 100000 - 3471 epochs total Iteration 0, loss = 0.0068 Iteration 20, loss = 0.0145 Iteration 40, loss = 0.0052 Iteration 60, loss = 0.0076 Iteration 80, loss = 0.0108 --- Epoch 1024 / 100000 - 3472 epochs total Iteration 0, loss = 0.0043 Iteration 20, loss = 0.0011 Iteration 40, loss = 0.0064 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0072 --- Epoch 1025 / 100000 - 3473 epochs total Iteration 0, loss = 0.0142 Iteration 20, loss = 0.0098 Iteration 40, loss = 0.0638 Iteration 60, loss = 0.0075 Iteration 80, loss = 0.0031 --- Epoch 1026 / 100000 - 3474 epochs total Iteration 0, loss = 0.0183 Iteration 20, loss = 0.0047 Iteration 40, loss = 0.0134 Iteration 60, loss = 0.0067 Iteration 80, loss = 0.0049 --- Epoch 1027 / 100000 - 3475 epochs total Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0092 Iteration 40, loss = 0.0024 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0073 --- Epoch 1028 / 100000 - 3476 epochs total Iteration 0, loss = 0.0174 Iteration 20, loss = 0.0043 Iteration 40, loss = 0.0189 Iteration 60, loss = 0.0049 Iteration 80, loss = 0.0059 --- Epoch 1029 / 100000 - 3477 epochs total Iteration 0, loss = 0.0045 Iteration 20, loss = 0.0339 Iteration 40, loss = 0.0187 Iteration 60, loss = 0.0109 Iteration 80, loss = 0.0478 --- Epoch 1030 / 100000 - 3478 epochs total Iteration 0, loss = 0.0225 Iteration 20, loss = 0.0031 Iteration 40, loss = 0.0046 Iteration 60, loss = 0.0088 Iteration 80, loss = 0.0044 --- Epoch 1031 / 100000 - 3479 epochs total Iteration 0, loss = 0.0282 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0181 Iteration 80, loss = 0.0140 --- Epoch 1032 / 100000 - 3480 epochs total Iteration 0, loss = 0.0035 Iteration 20, loss = 0.0142 Iteration 40, 
loss = 0.0208 Iteration 60, loss = 0.0114 Iteration 80, loss = 0.0017 --- Epoch 1033 / 100000 - 3481 epochs total Iteration 0, loss = 0.0120 Iteration 20, loss = 0.0110 Iteration 40, loss = 0.0015 Iteration 60, loss = 0.0192 Iteration 80, loss = 0.0161 --- Epoch 1034 / 100000 - 3482 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0372 Iteration 40, loss = 0.0060 Iteration 60, loss = 0.0034 Iteration 80, loss = 0.0494 --- Epoch 1035 / 100000 - 3483 epochs total Iteration 0, loss = 0.0031 Iteration 20, loss = 0.0039 Iteration 40, loss = 0.0178 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0050 --- Epoch 1036 / 100000 - 3484 epochs total Iteration 0, loss = 0.0158 Iteration 20, loss = 0.0117 Iteration 40, loss = 0.0125 Iteration 60, loss = 0.0038 Iteration 80, loss = 0.0041 --- Epoch 1037 / 100000 - 3485 epochs total Iteration 0, loss = 0.0233 Iteration 20, loss = 0.0123 Iteration 40, loss = 0.0021 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0320 --- Epoch 1038 / 100000 - 3486 epochs total Iteration 0, loss = 0.0014 Iteration 20, loss = 0.0131 Iteration 40, loss = 0.0038 Iteration 60, loss = 0.0031 Iteration 80, loss = 0.0027 --- Epoch 1039 / 100000 - 3487 epochs total Iteration 0, loss = 0.0180 Iteration 20, loss = 0.0020 Iteration 40, loss = 0.0272 Iteration 60, loss = 0.0021 Iteration 80, loss = 0.0257 --- Epoch 1040 / 100000 - 3488 epochs total Iteration 0, loss = 0.0080 Iteration 20, loss = 0.0048 Iteration 40, loss = 0.0117 Iteration 60, loss = 0.0040 Iteration 80, loss = 0.0066 --- Epoch 1041 / 100000 - 3489 epochs total Iteration 0, loss = 0.0025 Iteration 20, loss = 0.0023 Iteration 40, loss = 0.0037 Iteration 60, loss = 0.0092 Iteration 80, loss = 0.0087 --- Epoch 1042 / 100000 - 3490 epochs total Iteration 0, loss = 0.0078 Iteration 20, loss = 0.0051 Iteration 40, loss = 0.0446 Iteration 60, loss = 0.0052 Iteration 80, loss = 0.0070 --- Epoch 1043 / 100000 - 3491 epochs total Iteration 0, loss = 0.0389 Iteration 20, loss = 0.0149 
Iteration 40, loss = 0.0057 Iteration 60, loss = 0.0240 Iteration 80, loss = 0.0079 --- Epoch 1044 / 100000 - 3492 epochs total Iteration 0, loss = 0.0087 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0048 Iteration 60, loss = 0.0046 Iteration 80, loss = 0.0066 --- Epoch 1045 / 100000 - 3493 epochs total Iteration 0, loss = 0.0155 Iteration 20, loss = 0.0083 Iteration 40, loss = 0.0073 Iteration 60, loss = 0.0022 Iteration 80, loss = 0.0115 --- Epoch 1046 / 100000 - 3494 epochs total Iteration 0, loss = 0.0206 Iteration 20, loss = 0.0274 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0694 Iteration 80, loss = 0.0032 --- Epoch 1047 / 100000 - 3495 epochs total Iteration 0, loss = 0.0063 Iteration 20, loss = 0.0073 Iteration 40, loss = 0.0137 Iteration 60, loss = 0.0050 Iteration 80, loss = 0.0056 --- Epoch 1048 / 100000 - 3496 epochs total Iteration 0, loss = 0.0114 Iteration 20, loss = 0.0225 Iteration 40, loss = 0.0014 Iteration 60, loss = 0.0086 Iteration 80, loss = 0.0084 --- Epoch 1049 / 100000 - 3497 epochs total Iteration 0, loss = 0.0099 Iteration 20, loss = 0.0331 Iteration 40, loss = 0.0239 Iteration 60, loss = 0.0113 Iteration 80, loss = 0.0482 --- Epoch 1050 / 100000 - 3498 epochs total Iteration 0, loss = 0.0076 Iteration 20, loss = 0.0328 Iteration 40, loss = 0.0095 Iteration 60, loss = 0.0157 Iteration 80, loss = 0.0235 --- Epoch 1051 / 100000 - 3499 epochs total Iteration 0, loss = 0.0118 Iteration 20, loss = 0.0093 Iteration 40, loss = 0.0080 Iteration 60, loss = 0.0035 Iteration 80, loss = 0.0107 --- Epoch 1052 / 100000 - 3500 epochs total Iteration 0, loss = 0.0083 Iteration 20, loss = 0.0104 Iteration 40, loss = 0.0050 Iteration 60, loss = 0.0475 Iteration 80, loss = 0.0050
--------------------------------------------------------------------------- KeyboardInterrupt Traceback (most recent call last) <ipython-input-161-ca87b0d12256> in <module> ----> 1 train(model14, optimizer, epochs=100000, x_train=data["X_train"], y_train=data["y_train"], criterion=nn.MSELoss()) <ipython-input-18-95dee9c67ab2> in train(model, optimizer, epochs, x_train, y_train, criterion) 34 # Zero out all of the gradients for the variables which the optimizer 35 # will update. ---> 36 optimizer.zero_grad() 37 38 # This is the backwards pass: compute the gradient of the loss with /opt/anaconda3/envs/cs682/lib/python3.6/site-packages/torch/optim/optimizer.py in zero_grad(self) 170 if p.grad is not None: 171 p.grad.detach_() --> 172 p.grad.zero_() 173 174 def step(self, closure): KeyboardInterrupt:
# Evaluate model14 on the held-out test split: the grayscale images built by
# convertToBW are the inputs (X_test) and the original colour images are the
# targets (y_test), with mean-squared error as the criterion.
# NOTE(review): the preceding train(...) run ended in a KeyboardInterrupt, so
# model14 presumably holds the weights as of the interrupt -- confirm.
testModel(
    model14,
    x_test=data["X_test"],
    y_test=data["y_test"],
    criterion=nn.MSELoss(),
)